├── .github
    ├── ISSUE_TEMPLATE
    │   ├── bug.yml
    │   └── feature-request.yml
    ├── PULL_REQUEST_TEMPLATE.md
    ├── scripts
    │   ├── check_copyright_header.py
    │   ├── markdown_link_check_config.json
    │   ├── spellcheck.sh
    │   └── spellcheck_conf
    │   │   ├── spellcheck.yaml
    │   │   └── wordlist.txt
    └── workflows
    │   ├── pytest_cpu_gha_runner.yaml
    │   └── spellcheck.yml
├── .gitignore
├── 3p-integrations
    ├── README.md
    ├── aws
    │   ├── getting_started_llama_3_on_amazon_bedrock.ipynb
    │   ├── prompt_engineering_with_llama_2_on_amazon_bedrock.ipynb
    │   └── react_llama_3_bedrock_wk.ipynb
    ├── azure
    │   ├── Azure MaaS
    │   │   └── azure_api_example.ipynb
    │   └── README.md
    ├── crusoe
    │   ├── README.md
    │   └── vllm-fp8
    │   │   ├── README.md
    │   │   ├── assets
    │   │       ├── tpot_vs_qps_chart.png
    │   │       └── ttft_vs_qps_chart.png
    │   │   ├── benchmarks
    │   │       ├── backend_request_func.py
    │   │       ├── benchmark_serving.py
    │   │       └── sonnet.txt
    │   │   ├── convert_hf_to_fp8.py
    │   │   ├── main.tf
    │   │   ├── plot.py
    │   │   ├── pyproject.toml
    │   │   └── run_benchmark.sh
    ├── e2b-ai-analyst
    │   └── README.md
    ├── groq
    │   ├── groq-api-cookbook
    │   │   ├── function-calling-101-ecommerce
    │   │   │   ├── Function-Calling-101-Ecommerce.ipynb
    │   │   │   ├── customers.csv
    │   │   │   ├── orders.csv
    │   │   │   └── products.csv
    │   │   ├── json-mode-function-calling-for-sql
    │   │   │   ├── data
    │   │   │   │   ├── employees.csv
    │   │   │   │   └── purchases.csv
    │   │   │   ├── json-mode-function-calling-for-sql.ipynb
    │   │   │   └── verified-queries
    │   │   │   │   ├── employees-without-purchases.yaml
    │   │   │   │   ├── most-expensive-purchase.yaml
    │   │   │   │   ├── most-recent-purchases.yaml
    │   │   │   │   └── number-of-teslas.yaml
    │   │   ├── json-mode-social-determinants-of-health
    │   │   │   ├── SDOH-Json-mode.ipynb
    │   │   │   └── clinical_notes
    │   │   │   │   ├── 00456321.txt
    │   │   │   │   ├── 00567289.txt
    │   │   │   │   ├── 00678934.txt
    │   │   │   │   ├── 00785642.txt
    │   │   │   │   └── 00893247.txt
    │   │   ├── llama3-stock-market-function-calling
    │   │   │   └── llama3-stock-market-function-calling.ipynb
    │   │   ├── parallel-tool-use
    │   │   │   ├── parallel-tool-use.ipynb
    │   │   │   └── requirements.txt
    │   │   └── rag-langchain-presidential-speeches
    │   │   │   ├── presidential_speeches.csv
    │   │   │   └── rag-langchain-presidential-speeches.ipynb
    │   ├── groq-example-templates
    │   │   ├── conversational-chatbot-langchain
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── crewai-agents
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── groq-quickstart-conversational-chatbot
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── groqing-the-stock-market-function-calling-llama3
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── llamachat-conversational-chatbot-with-llamaIndex
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── presidential-speeches-rag-with-pinecone
    │   │   │   ├── README.md
    │   │   │   ├── main.py
    │   │   │   └── requirements.txt
    │   │   ├── text-to-sql-json-mode
    │   │   │   ├── README.md
    │   │   │   ├── data
    │   │   │   │   ├── employees.csv
    │   │   │   │   └── purchases.csv
    │   │   │   ├── main.py
    │   │   │   ├── prompts
    │   │   │   │   └── base_prompt.txt
    │   │   │   └── requirements.txt
    │   │   └── verified-sql-function-calling
    │   │   │   ├── README.md
    │   │   │   ├── data
    │   │   │       ├── employees.csv
    │   │   │       └── purchases.csv
    │   │   │   ├── main.py
    │   │   │   ├── requirements.txt
    │   │   │   └── verified-queries
    │   │   │       ├── employees-without-purchases.yaml
    │   │   │       ├── most-expensive-purchase.yaml
    │   │   │       ├── most-recent-purchases.yaml
    │   │   │       └── number-of-teslas.yaml
    │   └── llama3_cookbook_groq.ipynb
    ├── lamini
    │   └── text2sql_memory_tuning
    │   │   ├── README.md
    │   │   ├── assets
    │   │       ├── manual_filtering.png
    │   │       └── website.png
    │   │   ├── data
    │   │       ├── gold-test-set-v2.jsonl
    │   │       ├── gold-test-set.jsonl
    │   │       └── training_data
    │   │       │   ├── archive
    │   │       │       ├── generated_queries_large_filtered_cleaned.jsonl
    │   │       │       └── generated_queries_v2_large_filtered_cleaned.jsonl
    │   │       │   ├── generated_queries.jsonl
    │   │       │   ├── generated_queries_large.jsonl
    │   │       │   ├── generated_queries_large_filtered.jsonl
    │   │       │   ├── generated_queries_v2.jsonl
    │   │       │   ├── generated_queries_v2_large.jsonl
    │   │       │   └── generated_queries_v2_large_filtered.jsonl
    │   │   ├── meta_lamini.ipynb
    │   │   ├── nba_roster.db
    │   │   └── util
    │   │       ├── get_default_finetune_args.py
    │   │       ├── get_rubric.py
    │   │       ├── get_schema.py
    │   │       ├── load_dataset.py
    │   │       ├── make_llama_3_prompt.py
    │   │       ├── parse_arguments.py
    │   │       └── setup_logging.py
    ├── langchain
    │   ├── README.md
    │   ├── langgraph_rag_agent.ipynb
    │   ├── langgraph_rag_agent_local.ipynb
    │   └── langgraph_tool_calling_agent.ipynb
    ├── llama_on_prem.md
    ├── llamaindex
    │   ├── dlai_agentic_rag
    │   │   ├── Building_Agentic_RAG_with_Llamaindex_L2_Tool_Calling.ipynb
    │   │   ├── Building_Agentic_RAG_with_Llamaindex_L3_Building_an_Agent_Reasoning_Loop.ipynb
    │   │   ├── Building_Agentic_RAG_with_Llamaindex_L4_Building_a_Multi-Document_Agent.ipynb
    │   │   └── README.md
    │   └── llamaindex_cookbook.ipynb
    ├── modal
    │   └── many-llamas-human-eval
    │   │   ├── README.md
    │   │   ├── download.py
    │   │   ├── eval.py
    │   │   ├── generate.py
    │   │   ├── inference.py
    │   │   ├── plot.py
    │   │   └── run_e2e.sh
    ├── tgi
    │   ├── README.md
    │   └── merge_lora_weights.py
    ├── togetherai
    │   ├── README.md
    │   ├── datasets
    │   │   └── movies.json
    │   ├── images
    │   │   ├── BERTScore.png
    │   │   ├── CoQA.png
    │   │   ├── ColPaliMaxSim-1.png
    │   │   ├── Nvidia_collage.png
    │   │   ├── UMAP.png
    │   │   ├── cRAG.png
    │   │   ├── cRAG_indexing.png
    │   │   ├── cRAG_querytime.png
    │   │   ├── cluster.png
    │   │   ├── colpali_arch.png
    │   │   ├── conversation.png
    │   │   ├── deploy_CFT.png
    │   │   ├── ft_model.png
    │   │   ├── mmrag_only.png
    │   │   ├── page_25.png
    │   │   ├── repetition_task.png
    │   │   ├── reranking.png
    │   │   ├── semantic_search.png
    │   │   ├── simple_RAG.png
    │   │   ├── structured_text_image.png
    │   │   ├── summarization.png
    │   │   ├── summary_task.png
    │   │   ├── text_RAG.png
    │   │   ├── together-color.jpg
    │   │   ├── together.gif
    │   │   └── wandb_model.png
    │   ├── knowledge_graphs_with_structured_outputs.ipynb
    │   ├── llama_contextual_RAG.ipynb
    │   ├── multimodal_RAG_with_nvidia_investor_slide_deck.ipynb
    │   ├── pdf_to_podcast_using_llama_on_together.ipynb
    │   ├── structured_text_extraction_from_images.ipynb
    │   └── text_RAG_using_llama_on_together.ipynb
    ├── using_externally_hosted_llms.ipynb
    └── vllm
    │   ├── README.md
    │   └── inference.py
├── CODE_OF_CONDUCT.md
├── CONTRIBUTING.md
├── LICENSE
├── README.md
├── UPDATES.md
├── dev_requirements.txt
├── end-to-end-use-cases
    ├── ArticleSummarizer
    │   ├── .gitignore
    │   ├── README.md
    │   ├── app
    │   │   ├── .gitignore
    │   │   ├── build.gradle.kts
    │   │   ├── proguard-rules.pro
    │   │   └── src
    │   │   │   └── main
    │   │   │       ├── AndroidManifest.xml
    │   │   │       ├── java
    │   │   │           └── com
    │   │   │           │   └── example
    │   │   │           │       └── llamaandroiddemo
    │   │   │           │           ├── AppLog.java
    │   │   │           │           ├── AppLogging.java
    │   │   │           │           ├── AppUtils.java
    │   │   │           │           ├── DemoSharedPreferences.java
    │   │   │           │           ├── ExampleLlamaRemoteInference.kt
    │   │   │           │           ├── HomescreenActivity.kt
    │   │   │           │           ├── LanguageSelector.java
    │   │   │           │           ├── LogsActivity.java
    │   │   │           │           ├── LogsAdapter.java
    │   │   │           │           ├── MainActivity.java
    │   │   │           │           ├── Message.java
    │   │   │           │           ├── MessageAdapter.java
    │   │   │           │           ├── MessageType.java
    │   │   │           │           ├── ModelType.java
    │   │   │           │           ├── ModelUtils.java
    │   │   │           │           ├── PromptFormat.java
    │   │   │           │           ├── SettingsActivity.java
    │   │   │           │           └── SettingsFields.java
    │   │   │       └── res
    │   │   │           ├── drawable
    │   │   │               ├── banner_shape.xml
    │   │   │               ├── baseline_add_24.xml
    │   │   │               ├── baseline_add_photo_alternate_24.xml
    │   │   │               ├── baseline_article_24.xml
    │   │   │               ├── baseline_close_24.xml
    │   │   │               ├── baseline_delete_forever_24.xml
    │   │   │               ├── baseline_language_24.xml
    │   │   │               ├── baseline_restart_alt_24.xml
    │   │   │               ├── baseline_send_24.xml
    │   │   │               ├── baseline_settings_24.xml
    │   │   │               ├── baseline_stop_24.xml
    │   │   │               ├── btn.xml
    │   │   │               ├── chat_background.xml
    │   │   │               ├── custom_button_round.xml
    │   │   │               ├── expand_circle_down.xml
    │   │   │               ├── ic_launcher_background.xml
    │   │   │               ├── ic_launcher_foreground.xml
    │   │   │               ├── input_text_shape.xml
    │   │   │               ├── outline_add_box_48.xml
    │   │   │               ├── outline_camera_alt_48.xml
    │   │   │               ├── outline_image_48.xml
    │   │   │               ├── prompt_shape.xml
    │   │   │               ├── received_message.xml
    │   │   │               ├── sent_message.xml
    │   │   │               ├── summarizer.png
    │   │   │               └── three_dots.xml
    │   │   │           ├── layout
    │   │   │               ├── activity_benchmarking.xml
    │   │   │               ├── activity_homescreen.xml
    │   │   │               ├── activity_logs.xml
    │   │   │               ├── activity_main.xml
    │   │   │               ├── activity_settings.xml
    │   │   │               ├── logs_message.xml
    │   │   │               ├── received_message.xml
    │   │   │               ├── sent_message.xml
    │   │   │               └── system_message.xml
    │   │   │           ├── mipmap-anydpi-v26
    │   │   │               ├── ic_launcher.xml
    │   │   │               └── ic_launcher_round.xml
    │   │   │           ├── mipmap-hdpi
    │   │   │               ├── ic_launcher.webp
    │   │   │               └── ic_launcher_round.webp
    │   │   │           ├── mipmap-mdpi
    │   │   │               ├── ic_launcher.webp
    │   │   │               └── ic_launcher_round.webp
    │   │   │           ├── mipmap-xhdpi
    │   │   │               ├── ic_launcher.webp
    │   │   │               └── ic_launcher_round.webp
    │   │   │           ├── mipmap-xxhdpi
    │   │   │               ├── ic_launcher.webp
    │   │   │               └── ic_launcher_round.webp
    │   │   │           ├── mipmap-xxxhdpi
    │   │   │               ├── ic_launcher.webp
    │   │   │               └── ic_launcher_round.webp
    │   │   │           ├── values
    │   │   │               ├── colors.xml
    │   │   │               ├── strings.xml
    │   │   │               ├── styles.xml
    │   │   │               └── themes.xml
    │   │   │           └── xml
    │   │   │               ├── backup_rules.xml
    │   │   │               ├── data_extraction_rules.xml
    │   │   │               └── file_paths.xml
    │   ├── build.gradle.kts
    │   ├── gradle.properties
    │   ├── gradle
    │   │   └── wrapper
    │   │   │   └── gradle-wrapper.properties
    │   ├── gradlew
    │   ├── gradlew.bat
    │   ├── screenshot.png
    │   └── settings.gradle.kts
    ├── Contextual-Chunking-RAG
    │   ├── Example_FinancialReport_RAG.ipynb
    │   ├── README.md
    │   ├── Tutorial.ipynb
    │   ├── config.py
    │   ├── data
    │   │   └── llama_article.txt
    │   ├── embedding.py
    │   └── helper.py
    ├── Multi-Modal-RAG
    │   ├── README.md
    │   ├── notebooks
    │   │   ├── Part_1_Data_Preparation.ipynb
    │   │   ├── Part_2_Cleaning_Data_and_DB.ipynb
    │   │   └── Part_3_RAG_Setup_and_Validation.ipynb
    │   └── scripts
    │   │   ├── final_demo.py
    │   │   └── label_script.py
    ├── NotebookLlama
    │   ├── README.md
    │   ├── Step-1 PDF-Pre-Processing-Logic.ipynb
    │   ├── Step-2-Transcript-Writer.ipynb
    │   ├── Step-3-Re-Writer.ipynb
    │   ├── Step-4-TTS-Workflow.ipynb
    │   ├── TTS_Notes.md
    │   ├── requirements.txt
    │   └── resources
    │   │   ├── 2402.13116v4.pdf
    │   │   ├── Outline.jpg
    │   │   ├── _podcast.mp3
    │   │   ├── clean_extracted_text.txt
    │   │   ├── data.pkl
    │   │   └── podcast_ready_data.pkl
    ├── RAFT-Chatbot
    │   ├── README.md
    │   ├── config.py
    │   ├── eval_llama.json
    │   ├── format.py
    │   ├── images
    │   │   ├── Answers_Precision.png
    │   │   ├── LLM_score_comparison.png
    │   │   ├── Num_of_refusal_comparison.png
    │   │   └── RAFT.png
    │   ├── raft.py
    │   ├── raft.yaml
    │   ├── raft_eval.py
    │   ├── raft_eval_config.yaml
    │   └── raft_utils.py
    ├── README.md
    ├── agents
    │   ├── Agents_Tutorial
    │   │   ├── Tool_Calling_101.ipynb
    │   │   └── Tool_Calling_201.ipynb
    │   ├── DeepLearningai_Course_Notebooks
    │   │   ├── AI_Agentic_Design_Patterns_with_AutoGen_L4_Tool_Use_and_Conversational_Chess.ipynb
    │   │   ├── AI_Agents_in_LangGraph_L1_Build_an_Agent_from_Scratch.ipynb
    │   │   ├── Building_Agentic_RAG_with_Llamaindex_L1_Router_Engine.ipynb
    │   │   ├── Functions_Tools_and_Agents_with_LangChain_L1_Function_Calling.ipynb
    │   │   └── README.md
    │   ├── README.md
    │   └── calendar_assistant
    │   │   ├── README.md
    │   │   ├── assets
    │   │       ├── flow_diagram.png
    │   │       └── google_calendar.png
    │   │   └── tool_calling_google_api.ipynb
    ├── benchmarks
    │   ├── README.md
    │   ├── evals_synthetic_data
    │   │   ├── README.md
    │   │   ├── Workflow_Diagram.png
    │   │   ├── evals_with_synthetic_data.ipynb
    │   │   └── generated_data
    │   │   │   ├── data_0.json
    │   │   │   ├── data_1.json
    │   │   │   ├── data_10.json
    │   │   │   ├── data_11.json
    │   │   │   ├── data_2.json
    │   │   │   ├── data_3.json
    │   │   │   ├── data_4.json
    │   │   │   ├── data_5.json
    │   │   │   ├── data_6.json
    │   │   │   ├── data_7.json
    │   │   │   ├── data_8.json
    │   │   │   ├── data_9.json
    │   │   │   └── tabular_data.csv
    │   ├── inference
    │   │   ├── README.md
    │   │   ├── cloud
    │   │   │   ├── README.md
    │   │   │   ├── aws
    │   │   │   │   └── fmbench
    │   │   │   │   │   ├── README.md
    │   │   │   │   │   ├── config.yml
    │   │   │   │   │   └── img
    │   │   │   │   │       ├── CFT.png
    │   │   │   │   │       ├── business_summary.png
    │   │   │   │   │       ├── instances.png
    │   │   │   │   │       └── latency_vs_tokens.png
    │   │   │   └── azure
    │   │   │   │   ├── chat_azure_api_benchmark.py
    │   │   │   │   ├── input.jsonl
    │   │   │   │   ├── parameters.json
    │   │   │   │   └── pretrained_azure_api_benchmark.py
    │   │   ├── on_prem
    │   │   │   ├── README.md
    │   │   │   └── vllm
    │   │   │   │   ├── chat_vllm_benchmark.py
    │   │   │   │   ├── input.jsonl
    │   │   │   │   ├── parameters.json
    │   │   │   │   └── pretrained_vllm_benchmark.py
    │   │   └── requirements.txt
    │   └── llm_eval_harness
    │   │   ├── README.md
    │   │   └── meta_eval
    │   │       ├── README.md
    │   │       ├── eval_config.yaml
    │   │       ├── meta_template
    │   │           ├── bbh
    │   │           │   ├── bbh_3shot_cot.yaml
    │   │           │   └── utils.py
    │   │           ├── gpqa
    │   │           │   ├── gpqa_0shot.yaml
    │   │           │   └── utils.py
    │   │           ├── gpqa_cot
    │   │           │   ├── gpqa_0shot_cot.yaml
    │   │           │   └── utils.py
    │   │           ├── ifeval
    │   │           │   ├── ifeval.yaml
    │   │           │   └── utils.py
    │   │           ├── math_hard
    │   │           │   ├── math_4shot_cot.yaml
    │   │           │   ├── math_hard_0shot_cot.yaml
    │   │           │   └── utils.py
    │   │           ├── meta_instruct.yaml
    │   │           ├── meta_pretrain.yaml
    │   │           ├── mmlu
    │   │           │   ├── mmlu_instruct.yaml
    │   │           │   ├── mmlu_pretrain.yaml
    │   │           │   └── utils.py
    │   │           └── mmlu_pro
    │   │           │   ├── mmlu_pro_5shot_cot_instruct.yaml
    │   │           │   ├── mmlu_pro_5shot_cot_pretrain.yaml
    │   │           │   └── utils.py
    │   │       └── prepare_meta_eval.py
    ├── book-character-mindmap
    │   ├── .gitignore
    │   ├── README.md
    │   ├── package-lock.json
    │   ├── package.json
    │   ├── public
    │   │   ├── character_relationship.png
    │   │   ├── chat_interface.png
    │   │   ├── favicon.ico
    │   │   ├── index.html
    │   │   ├── logo192.png
    │   │   ├── logo512.png
    │   │   ├── manifest.json
    │   │   ├── mindmap.png
    │   │   └── robots.txt
    │   ├── server
    │   │   ├── requirements.txt
    │   │   └── server.py
    │   ├── src
    │   │   ├── App.css
    │   │   ├── App.js
    │   │   ├── App.test.js
    │   │   ├── approuter.jsx
    │   │   ├── index.css
    │   │   ├── index.js
    │   │   ├── logo.svg
    │   │   ├── pages
    │   │   │   ├── Layout.jsx
    │   │   │   ├── bookPage
    │   │   │   │   ├── components
    │   │   │   │   │   ├── CharacterGraph.jsx
    │   │   │   │   │   ├── ChatInterface.jsx
    │   │   │   │   │   └── ErrorBoundary.jsx
    │   │   │   │   └── index.jsx
    │   │   │   └── homePage
    │   │   │   │   ├── components
    │   │   │   │       ├── Features.jsx
    │   │   │   │       ├── Hero.jsx
    │   │   │   │       └── HowItWorks.jsx
    │   │   │   │   └── index.jsx
    │   │   ├── reportWebVitals.js
    │   │   └── setupTests.js
    │   └── tailwind.config.js
    ├── browser_use
    │   ├── README.md
    │   └── agent
    │   │   ├── browser-use-quickstart.ipynb
    │   │   └── sample_screenshot.png
    ├── coding
    │   └── text2sql
    │   │   ├── README.md
    │   │   ├── csv2db.py
    │   │   ├── nba.txt
    │   │   ├── nba_roster.db
    │   │   ├── quickstart.ipynb
    │   │   ├── requirements.txt
    │   │   └── txt2csv.py
    ├── customerservice_chatbots
    │   ├── RAG_chatbot
    │   │   ├── RAG_Chatbot_Example.ipynb
    │   │   ├── data
    │   │   │   └── Llama Getting Started Guide.pdf
    │   │   ├── requirements.txt
    │   │   └── vectorstore
    │   │   │   ├── db_faiss
    │   │   │       ├── index.faiss
    │   │   │       └── index.pkl
    │   │   │   └── mongodb
    │   │   │       └── rag_mongodb_llama3_huggingface_open_source.ipynb
    │   ├── README.md
    │   ├── messenger_chatbot
    │   │   ├── llama_messenger.py
    │   │   └── messenger_llama3.md
    │   └── whatsapp_chatbot
    │   │   ├── llama_chatbot.py
    │   │   └── whatsapp_llama3.md
    ├── email_agent
    │   ├── 1.png
    │   ├── 2.png
    │   ├── 3.png
    │   ├── README.md
    │   ├── email_agent.png
    │   ├── email_agent.py
    │   ├── functions_prompt.py
    │   ├── main.py
    │   └── requirements.txt
    ├── github_triage
    │   ├── README.md
    │   ├── config.yaml
    │   ├── llm.py
    │   ├── output
    │   │   └── pytorch
    │   │   │   └── pytorch
    │   │   │       └── 2024-08-28_2024-08-28
    │   │   │           ├── annotated_issues.csv
    │   │   │           ├── challenges.csv
    │   │   │           ├── overview.csv
    │   │   │           ├── plots
    │   │   │               ├── commits.png
    │   │   │               ├── engagement_sankey.png
    │   │   │               ├── expertise.png
    │   │   │               ├── sentiment.png
    │   │   │               ├── severity.png
    │   │   │               └── themes.png
    │   │   │           └── report.pdf
    │   ├── pdf_report.py
    │   ├── plots.py
    │   ├── requirements.txt
    │   ├── triage.py
    │   ├── utils.py
    │   └── walkthrough.ipynb
    ├── long_context
    │   └── H2O
    │   │   ├── README.md
    │   │   ├── data
    │   │       └── summarization
    │   │       │   ├── cnn_dailymail.jsonl
    │   │       │   └── xsum.jsonl
    │   │   ├── requirements.txt
    │   │   ├── run_streaming.py
    │   │   ├── run_summarization.py
    │   │   ├── src
    │   │       └── streaming.sh
    │   │   └── utils
    │   │       ├── cache.py
    │   │       ├── llama.py
    │   │       └── streaming.py
    ├── multilingual
    │   ├── README.md
    │   ├── extend_tokenizer.py
    │   ├── img
    │   │   ├── phase1_eval_loss.png
    │   │   ├── phase1_train_loss.png
    │   │   ├── phase2_eval_loss.png
    │   │   └── phase2_train_loss.png
    │   ├── prepare_data.py
    │   └── train_tokenizer.py
    ├── research_paper_analyzer
    │   ├── README.md
    │   ├── requirements.txt
    │   └── research_analyzer.py
    ├── video_summary.ipynb
    └── whatsapp_llama_4_bot
    │   ├── .env
    │   ├── README.md
    │   ├── ec2_endpoints.py
    │   ├── ec2_services.py
    │   ├── requirements.txt
    │   ├── webhook_main.py
    │   └── webhook_utils.py
├── getting-started
    ├── RAG
    │   └── hello_llama_cloud.ipynb
    ├── README.md
    ├── build_with_llama_4.ipynb
    ├── build_with_llama_api.ipynb
    ├── finetuning
    │   ├── LLM_finetuning_overview.md
    │   ├── README.md
    │   ├── datasets
    │   │   ├── README.md
    │   │   ├── custom_dataset.py
    │   │   ├── ocrvqa_dataset.py
    │   │   └── raft_dataset.py
    │   ├── finetune_llama4.md
    │   ├── finetune_vision_model.md
    │   ├── finetuning.py
    │   ├── multi_node.slurm
    │   ├── multigpu_finetuning.md
    │   ├── quickstart_peft_finetuning.ipynb
    │   └── singlegpu_finetuning.md
    ├── inference
    │   ├── README.md
    │   ├── api_inference
    │   │   ├── README.md
    │   │   ├── api_inference.py
    │   │   └── llama_inference_api.ipynb
    │   └── local_inference
    │   │   ├── README.md
    │   │   ├── chat_completion
    │   │       ├── chat_completion.py
    │   │       └── chats.json
    │   │   ├── inference.py
    │   │   ├── multi_modal_infer.py
    │   │   └── samsum_prompt.txt
    ├── llama-tools
    │   └── llama-prompt-ops_101.ipynb
    └── responsible_ai
    │   ├── README.md
    │   ├── code_shield_usage_demo.ipynb
    │   ├── llama_guard
    │       ├── README.md
    │       ├── __init__.py
    │       ├── llama_guard_customization_via_prompting_and_fine_tuning.ipynb
    │       ├── llama_guard_finetuning_multiple_violations_with_torchtune.ipynb
    │       ├── llama_guard_text_and_vision_inference.ipynb
    │       ├── resources
    │       │   ├── dog.jpg
    │       │   └── pasta.jpeg
    │       └── torchtune_configs
    │       │   ├── 8B_guard_full.yaml
    │       │   └── custom_template.py
    │   └── prompt_guard
    │       ├── README.md
    │       ├── __init__.py
    │       ├── inference.py
    │       ├── prompt_guard_1_inference.py
    │       └── prompt_guard_tutorial.ipynb
├── pyproject.toml
├── requirements.txt
└── src
    ├── README.md
    ├── docs
        ├── FAQ.md
        ├── LLM_finetuning.md
        ├── img
        │   ├── WhatApp_Llama4_integration.jpeg
        │   ├── a_colorful_llama_doing_ai_programming.jpeg
        │   ├── a_llama_dressed_as_a_professional_mountain.jpeg
        │   ├── cat.jpeg
        │   ├── feature_based_fn.png
        │   ├── feature_based_fn_2.png
        │   ├── full_param_fn.png
        │   ├── gnocchi_alla_romana.jpeg
        │   ├── grocery_shopping_bascket_with_salmon_in_package.jpeg
        │   ├── k1.jpg
        │   ├── k1_resized.jpg
        │   ├── k2.jpg
        │   ├── k2_resized.jpg
        │   ├── k3.jpg
        │   ├── k3_resized.jpg
        │   ├── k4.jpg
        │   ├── k4_resized.jpg
        │   ├── llama-mobile-confirmed.png
        │   ├── llama-recipes.png
        │   ├── llama2_gradio.png
        │   ├── llama2_streamlit.png
        │   ├── llama2_streamlit2.png
        │   ├── llama_stack.png
        │   ├── messenger_api_settings.png
        │   ├── messenger_llama_arch.jpg
        │   ├── meta_release.png
        │   ├── resized_image.jpg
        │   ├── thumbnail_IMG_1329.jpg
        │   ├── thumbnail_IMG_1440.jpg
        │   ├── thumbnail_IMG_6385.jpg
        │   ├── wandb_screenshot.png
        │   ├── whatsapp_dashboard.jpg
        │   └── whatsapp_llama_arch.jpg
        ├── multi_gpu.md
        └── single_gpu.md
    ├── llama_cookbook
        ├── configs
        │   ├── __init__.py
        │   ├── datasets.py
        │   ├── fsdp.py
        │   ├── peft.py
        │   ├── quantization.py
        │   ├── training.py
        │   └── wandb.py
        ├── data
        │   ├── __init__.py
        │   ├── concatenator.py
        │   ├── llama_guard
        │   │   ├── README.md
        │   │   ├── __init__.py
        │   │   ├── finetuning_data_formatter.py
        │   │   └── finetuning_data_formatter_example.py
        │   └── sampler.py
        ├── datasets
        │   ├── __init__.py
        │   ├── alpaca_dataset.py
        │   ├── custom_dataset.py
        │   ├── grammar_dataset
        │   │   ├── __init__.py
        │   │   ├── grammar_dataset.py
        │   │   └── grammar_dataset_process.ipynb
        │   ├── samsum_dataset.py
        │   └── toxicchat_dataset.py
        ├── finetuning.py
        ├── inference
        │   ├── __init__.py
        │   ├── chat_utils.py
        │   ├── checkpoint_converter_fsdp_hf.py
        │   ├── llm.py
        │   ├── model_utils.py
        │   ├── prompt_format_utils.py
        │   └── safety_utils.py
        ├── model_checkpointing
        │   ├── __init__.py
        │   └── checkpoint_handler.py
        ├── policies
        │   ├── __init__.py
        │   ├── activation_checkpointing_functions.py
        │   ├── anyprecision_optimizer.py
        │   ├── mixed_precision.py
        │   └── wrapping.py
        ├── tools
        │   ├── README.md
        │   ├── compare_llama_weights.py
        │   └── convert_hf_weights_to_llama.py
        └── utils
        │   ├── __init__.py
        │   ├── config_utils.py
        │   ├── dataset_utils.py
        │   ├── flop_utils.py
        │   ├── fsdp_utils.py
        │   ├── memory_utils.py
        │   ├── plot_metrics.py
        │   └── train_utils.py
    └── tests
        ├── conftest.py
        ├── datasets
            ├── test_custom_dataset.py
            ├── test_grammar_datasets.py
            └── test_samsum_datasets.py
        ├── test_batching.py
        ├── test_chat_completion.py
        ├── test_finetuning.py
        ├── test_finetuning_data_formatter.py
        ├── test_sampler.py
        ├── test_train_utils.py
        └── utils.py


/.github/ISSUE_TEMPLATE/feature-request.yml:
--------------------------------------------------------------------------------
 1 | name: 🚀 Feature request
 2 | description: Submit a proposal/request for a new llama-cookbook feature
 3 | 
 4 | body:
 5 | - type: textarea
 6 |   id: feature-pitch
 7 |   attributes:
 8 |     label: 🚀 The feature, motivation and pitch
 9 |     description: >
10 |       A clear and concise description of the feature proposal. Please outline the motivation for the proposal. Is your feature request related to a specific problem? e.g., *"I'm working on X and would like Y to be possible"*. If this is related to another GitHub issue, please link here too.
11 |   validations:
12 |     required: true
13 | 
14 | - type: textarea
15 |   id: alternatives
16 |   attributes:
17 |     label: Alternatives
18 |     description: >
19 |       A description of any alternative solutions or features you've considered, if any.
20 | 
21 | - type: textarea
22 |   id: additional-context
23 |   attributes:
24 |     label: Additional context
25 |     description: >
26 |       Add any other context or screenshots about the feature request.
27 | 
28 | - type: markdown
29 |   attributes:
30 |     value: >
31 |       Thanks for contributing 🎉!


--------------------------------------------------------------------------------
/.github/PULL_REQUEST_TEMPLATE.md:
--------------------------------------------------------------------------------
 1 | # What does this PR do?
 2 | 
 3 | <!--
 4 | Congratulations! You've made it this far! You're not quite done yet though.
 5 | 
 6 | Please include a good title that fully reflects the extent of your awesome contribution.
 7 | 
 8 | Then, please replace this with a description of the change and which issue is fixed (if applicable). Please also include relevant motivation and context. List any dependencies (if any) that are required for this change.
 9 | 
10 | -->
11 | 
12 | <!-- Remove if not applicable -->
13 | 
14 | Fixes # (issue)
15 | 
16 | 
17 | ## Feature/Issue validation/testing
18 | 
19 | Please describe the tests that you ran to verify your changes and relevant result summary. Provide instructions so it can be reproduced.
20 | Please also list any relevant details for your test configuration.
21 | 
22 | - [ ] Test A
23 | Logs for Test A
24 | 
25 | - [ ] Test B
26 | Logs for Test B
27 | 
28 | 
29 | ## Before submitting
30 | - [ ] This PR fixes a typo or improves the docs (you can dismiss the other checks if that's the case).
31 | - [ ] Did you read the [contributor guideline](https://github.com/meta-llama/llama-cookbook/blob/main/CONTRIBUTING.md),
32 |       Pull Request section?
33 | - [ ] Was this discussed/approved via a Github issue? Please add a link
34 |       to it if that's the case.
35 | - [ ] Did you make sure to update the documentation with your changes?  
36 | - [ ] Did you write any new necessary tests?
37 | 
38 | Thanks for contributing 🎉!
39 | 


--------------------------------------------------------------------------------
/.github/scripts/check_copyright_header.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import re
 5 | from pathlib import Path
 6 | 
 7 | WORK_DIR = Path(__file__).parents[1]
 8 | PATTERN = "(Meta Platforms, Inc. and affiliates)|(Facebook, Inc(\.|,)? and its affiliates)|([0-9]{4}-present(\.|,)? Facebook)|([0-9]{4}(\.|,)? Facebook)"
 9 | 
10 | HEADER = """# Copyright (c) Meta Platforms, Inc. and affiliates.
11 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.\n\n"""
12 | 
13 | #Files in black list must be relative to main repo folder
14 | BLACKLIST = ["tools/benchmarks/llm_eval_harness/open_llm_leaderboard/hellaswag_utils.py"]
15 | 
16 | if __name__ == "__main__":
17 |     for ext in ["*.py", "*.sh"]:
18 |         for file in WORK_DIR.rglob(ext):
19 |             normalized = file.relative_to(WORK_DIR)
20 |             if normalized.as_posix() in BLACKLIST:
21 |                 continue
22 |             
23 |             text = file.read_text()
24 |             if not re.search(PATTERN, text):
25 |                 text = HEADER + text
26 |                 file.write_text(text)
27 |         


--------------------------------------------------------------------------------
/.github/scripts/markdown_link_check_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "retryOn429": true,
 3 |   "retryCount": 5,
 4 |   "fallbackRetryDelay": "10s",
 5 |   "httpHeaders": [
 6 |     {
 7 |       "urls": [
 8 |         "https://docs.github.com/",
 9 |         "https://help.github.com/"
10 |       ],
11 |       "headers": {
12 |         "Accept-Encoding": "zstd, br, gzip, deflate"
13 |       }
14 |     }
15 |   ],
16 |   "ignorePatterns": [
17 |     {
18 |       "pattern": "^http(s)?://127.0.0.1.*"
19 |     },
20 |     {
21 |       "pattern": "^http(s)?://localhost.*"
22 |     },
23 |     {
24 |       "pattern": "https://www.intel.com/content/www/us/en/developer/articles/news/llama2.html"
25 |     },
26 |     {
27 |       "pattern": "http(s.?)?:\/\/(www\.)?linkedin\.com\.*"
28 |     },
29 |     {
30 |       "pattern": "http(s?)?:\/\/(www\.)?medium\.com\/.*"
31 |     }
32 |   ]
33 | }
34 | 


--------------------------------------------------------------------------------
/.github/scripts/spellcheck.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 3 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 4 | # Source: https://github.com/pytorch/torchx/blob/main/scripts/spellcheck.sh
 5 | set -ex
 6 | sudo apt-get install aspell
 7 | 
 8 | if [[ -z "$@" ]]; then
 9 |     sources=$(find -name '*.md')
10 | else
11 |     sources=$@
12 | fi
13 | 
14 | sources_arg=""
15 | for src in $sources; do
16 |         sources_arg="${sources_arg} -S $src"
17 | done
18 | 
19 | if [ ! "$sources_arg" ]; then
20 | 	echo "No files to spellcheck"
21 | else
22 | 	pyspelling -c .github/scripts/spellcheck_conf/spellcheck.yaml --name Markdown $sources_arg
23 | fi
24 | 


--------------------------------------------------------------------------------
/.github/scripts/spellcheck_conf/spellcheck.yaml:
--------------------------------------------------------------------------------
 1 | matrix:
 2 | - name: Markdown
 3 |   apsell:
 4 |     lang: en
 5 |     d: en_US
 6 |   dictionary:
 7 |     wordlists:
 8 |     - .github/scripts/spellcheck_conf/wordlist.txt
 9 |     output: .github/scripts/spellcheck_conf/wordlist.dic
10 |     encoding: utf-8
11 |   pipeline:
12 |   - pyspelling.filters.context:
13 |       context_visible_first: true
14 |       delimiters:
15 |       - open: '(?s)^ *(?P<open>`{3,})[a-z0-9]*?$'
16 |         close: '^(?P=open)$'
17 |       - open: ''
18 |         content: 'https?://[-a-zA-Z0-9.]+?\.[a-z]{2,6}[-?=&%.0-9a-zA-Z/_#]*'
19 |         close: ''
20 |   - pyspelling.filters.markdown:
21 |       markdown_extensions:
22 |       - markdown.extensions.extra:
23 | 


--------------------------------------------------------------------------------
/.github/workflows/spellcheck.yml:
--------------------------------------------------------------------------------
 1 | name: SpellCheck
 2 | 
 3 | on:
 4 |   push:
 5 |     branches:
 6 |       - main
 7 |   pull_request:
 8 |     branches:
 9 |       - main
10 | jobs:
11 |   build:
12 |     runs-on: ubuntu-24.04
13 |     name: Lint changed files
14 |     steps:
15 |       - uses: actions/checkout@v3
16 |         with:
17 |           fetch-depth: 0  # OR "2" -> To retrieve the preceding commit.
18 | 
19 |       - name: Check links in all markdown files
20 |         uses: gaurav-nelson/github-action-markdown-link-check@1.0.13
21 |         with:
22 |           use-verbose-mode: 'yes'
23 |           config-file: ".github/scripts/markdown_link_check_config.json"
24 | 
25 |       - name: Get changed files
26 |         id: changed-files
27 |         uses: tj-actions/changed-files@v45.0.8
28 |         with:
29 | 
30 |           files: |
31 |             **/*.py
32 | 
33 |   spellcheck:
34 |     runs-on: ubuntu-24.04
35 |     steps:
36 |       - uses: actions/checkout@v3
37 | 
38 |       - name: Install dependencies
39 |         run: |
40 |           sudo apt-get install aspell aspell-en
41 |           pip install pyspelling
42 | 
43 |       - name: Get changed files
44 |         id: changed-files
45 |         uses: tj-actions/changed-files@v45.0.8
46 |         with:
47 |           files: |
48 |             **/*.md
49 | 
50 |       - name: Check spellings
51 |         run: |
52 |           sources=""
53 |           for file in ${{ steps.changed-files.outputs.all_changed_files }}; do
54 |             sources="${sources} -S $file"
55 |           done
56 |           if [ ! "$sources" ]; then
57 |             echo "No files to spellcheck"
58 |           else
59 |             pyspelling -c $GITHUB_WORKSPACE/.github/scripts/spellcheck_conf/spellcheck.yaml --name Markdown $sources
60 |           fi
61 | 
62 |       - name: In the case of misspellings
63 |         if: ${{ failure() }}
64 |         run: |
65 |           echo "Please fix the misspellings. If you are sure about some of them, "
66 |           echo "so append those to .github/scripts/spellcheck_conf/wordlist.txt"
67 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | .DS_Store
2 | __pycache__
3 | .ipynb_checkpoints
4 | wandb/
5 | artifacts/
6 | node_modules/
7 | 


--------------------------------------------------------------------------------
/3p-integrations/azure/README.md:
--------------------------------------------------------------------------------
1 | In this folder, we show various recipes for Llama models working with Azure AI services. This includes:
2 | * Examples for running Llama model inference on Azure's serverless API offerings (aka. MaaS)
3 | 


--------------------------------------------------------------------------------
/3p-integrations/crusoe/README.md:
--------------------------------------------------------------------------------
 1 | Below are recipes for deploying common Llama workflows on [Crusoe's](https://crusoe.ai) high-performance, sustainable cloud. Each workflow corresponds to a subfolder with its own README and supplemental materials. Please reference the table below for hardware requirements.
 2 | 
 3 | | Workflow | Model(s) | VM type | Storage |
 4 | |:----:  | :----:  | :----:| :----: |
 5 | | [Serving Llama3.1 in FP8 with vLLM](vllm-fp8/) | [meta-llama/Meta-Llama-3.1-70B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3.1-70B-Instruct), [meta-llama/Meta-Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3.1-8B-Instruct) | l40s-48gb.8x | 256 GiB Persistent Disk |
 6 | 
 7 | # Requirements
 8 | First, ensure that you have a Crusoe account (you can sign up [here](https://console.crusoecloud.com/)). We will provision resources using Terraform, please ensure that your environment is configured and refer to the Crusoe [docs](https://github.com/crusoecloud/terraform-provider-crusoe?tab=readme-ov-file#getting-started) for guidance.
 9 | 
10 | # Serving Models
11 | Some recipes in this repo require firewall rules to expose ports in order to reach the inference server. To manage firewall rules, please refer to our [networking documentation](https://docs.crusoecloud.com/networking/firewall-rules/managing-firewall-rules).
12 | 


--------------------------------------------------------------------------------
/3p-integrations/crusoe/vllm-fp8/assets/tpot_vs_qps_chart.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/crusoe/vllm-fp8/assets/tpot_vs_qps_chart.png


--------------------------------------------------------------------------------
/3p-integrations/crusoe/vllm-fp8/assets/ttft_vs_qps_chart.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/crusoe/vllm-fp8/assets/ttft_vs_qps_chart.png


--------------------------------------------------------------------------------
/3p-integrations/crusoe/vllm-fp8/main.tf:
--------------------------------------------------------------------------------
 1 | terraform {
 2 |   required_providers {
 3 |     crusoe = {
 4 |       source = "registry.terraform.io/crusoecloud/crusoe"
 5 |     }
 6 |   }
 7 | }
 8 | 
 9 | locals {
10 |   my_ssh_key = file("~/.ssh/id_ed25519.pub")
11 | }
12 | 
13 | // new VM
14 | resource "crusoe_compute_instance" "vllm_vm" {
15 |   name     = "vllm-example"
16 |   type     = "l40s-48gb.8x"
17 |   location = "us-southcentral1-a"
18 | 
19 |   # specify the base image
20 |   image = "ubuntu22.04-nvidia-slurm:12.4"
21 | 
22 |   disks = [
23 |     {
24 |       id              = crusoe_storage_disk.vllm_data_disk.id
25 |       mode            = "read-write"
26 |       attachment_type = "data"
27 |     }
28 |   ]
29 | 
30 |   ssh_key = local.my_ssh_key
31 | }
32 | 
33 | resource "crusoe_storage_disk" "vllm_data_disk" {
34 |   name     = "vllm-example-disk"
35 |   size     = "256GiB"
36 |   location = "us-southcentral1-a"
37 | }
38 | 
39 | output "instance_public_ip" {
40 |   value = crusoe_compute_instance.vllm_vm.network_interfaces[0].public_ipv4.address
41 | }
42 | 


--------------------------------------------------------------------------------
/3p-integrations/crusoe/vllm-fp8/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [project]
 2 | name = "vllm-l40s"
 3 | version = "0.1.0"
 4 | description = "Add your description here"
 5 | readme = "README.md"
 6 | requires-python = ">=3.10"
 7 | dependencies = [
 8 |     "setuptools>=74.0.0",
 9 |     "vllm>=0.5.5",
10 |     "matplotlib>=3.9.2",
11 |     "llmcompressor>=0.1.0",
12 | ]
13 | 


--------------------------------------------------------------------------------
/3p-integrations/crusoe/vllm-fp8/run_benchmark.sh:
--------------------------------------------------------------------------------
 1 | TOTAL_SECONDS=120
 2 | QPS_RATES=("1" "3" "5" "7" "9")
 3 | 
 4 | for QPS in ${QPS_RATES[@]}; do
 5 |     NUM_PROMPTS=$((TOTAL_SECONDS * QPS))
 6 |     echo "===== RUNNING NUM_PROMPTS = $NUM_PROMPTS QPS = $QPS ====="
 7 | 
 8 |     uv run benchmarks/benchmark_serving.py \
 9 |         --model $MODEL \
10 |         --dataset-name sonnet --sonnet-input-len 550 --sonnet-output-len 150 --dataset-path benchmarks/sonnet.txt \
11 |         --num-prompts $NUM_PROMPTS --request-rate $QPS --save-result
12 | done


--------------------------------------------------------------------------------
/3p-integrations/e2b-ai-analyst/README.md:
--------------------------------------------------------------------------------
 1 | # AI Analyst with Llama and E2B
 2 | This is an AI-powered code and data analysis tool powered by Meta Llama and the [E2B SDK](https://e2b.dev/docs).
 3 | 
 4 | → Try on [ai-analyst.e2b.dev](https://ai-analyst.e2b.dev/)
 5 | 
 6 | ## Features
 7 | - 🔸 Analyze data with Meta's Llama 3.1 and 3.2
 8 | - 🔸 Upload CSV files
 9 | - 🔸 Create interactive charts
10 | 
11 | **Powered by:**
12 | 
13 | - 🔸 ✶ [E2B Sandbox](https://github.com/e2b-dev/code-interpreter)
14 | - 🔸 Vercel's AI SDK
15 | - 🔸 Next.js
16 | - 🔸 echarts library for interactive charts
17 | 
18 | **Supported LLM Providers:**
19 | - 🔸 TogetherAI
20 | - 🔸 Fireworks
21 | - 🔸 Ollama
22 | 
23 | **Supported chart types:**
24 | - 🔸 All the supported charts are described [here](https://e2b.dev/docs/code-interpreting/create-charts-visualizations/interactive-charts#supported-intertactive-charts).
25 | 
26 | 
27 | ## Get started
28 | 
29 | Visit the [online version](https://ai-analyst.e2b.dev/) or run locally on your own.
30 | 
31 | ### 1. Clone repository
32 | ```
33 | git clone https://github.com/e2b-dev/ai-analyst.git
34 | ```
35 | 
36 | ### 2. Install dependencies
37 | ```
38 | cd ai-analyst && npm i
39 | ```
40 | 
41 | ### 3. Add E2B API key
42 | Copy `.example.env` to `.env.local` and fill in `E2B_API_KEY`.
43 | 
44 | - Get your [E2B API key here](https://e2b.dev/dashboard?tab=keys).
45 | 
46 | ### 4. Configure LLM provider
47 | 
48 | In `.env.local`, add an API key for at least one LLM provider:
49 | 
50 | - Fireworks: `FIREWORKS_API_KEY`
51 | - Together AI: `TOGETHER_API_KEY`
52 | 
53 | For Ollama, provide the base URL instead of the API key:
54 | 
55 | - Ollama: `OLLAMA_BASE_URL`
56 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/function-calling-101-ecommerce/customers.csv:
--------------------------------------------------------------------------------
 1 | customer_id,name,email,address
 2 | 1,Erin Boyle MD,erin.boyle.md@example.com,"165 Brown Springs
 3 | Michaelport, IL 60228"
 4 | 2,Matthew Saunders,matthew.saunders@example.com,"219 Steven Mountains
 5 | Port Gabriellafort, OH 52281"
 6 | 3,Amanda Anderson,amanda.anderson@example.com,"498 Laurie Glens
 7 | Mitchelltown, CT 93655"
 8 | 4,Julian Butler,julian.butler@example.com,"909 Rodriguez Harbors Suite 119
 9 | New Tracyburgh, MS 15487"
10 | 5,Zachary Mitchell MD,zachary.mitchell.md@example.com,"9087 Matthew Drives
11 | Caitlynshire, OR 42442"
12 | 6,Troy Bennett,troy.bennett@example.com,"73329 Kimberly Loaf Apt. 029
13 | Shellyborough, TX 55939"
14 | 7,Allison Hall,allison.hall@example.com,"210 Shannon Camp
15 | New Michael, MO 65990"
16 | 8,Carolyn Davis,carolyn.davis@example.com,"64228 Carol Courts Suite 087
17 | New Micheleshire, MT 42516"
18 | 9,Cindy Munoz,cindy.munoz@example.com,"1722 Christine Plaza
19 | Danielport, UT 12261"
20 | 10,Tom Testuser,tom.testuser@example.com,"451 Victoria Bridge Suite 529
21 | Pageton, WI 27404"
22 | 11,Charles Walker,charles.walker@example.com,"2077 Lamb Drive
23 | Salazarton, IN 54619"
24 | 12,Brianna Molina,brianna.molina@example.com,"586 Khan Mills Suite 202
25 | Lake Dominique, VA 98527"
26 | 13,Austin Andrade,austin.andrade@example.com,"4857 Donna Cliffs
27 | Floydstad, PR 82540"
28 | 14,Brandon Andrade,brandon.andrade@example.com,"906 Olivia Motorway
29 | Kelleyfort, AK 48960"
30 | 15,Diane Lam,diane.lam@example.com,"070 Eric Rapid Suite 159
31 | Townsendbury, MI 57664"
32 | 16,Jason Kelly,jason.kelly@example.com,"873 Angela Track Apt. 972
33 | Stephenville, NV 32705"
34 | 17,Mr. Mitchell Saunders,mr..mitchell.saunders@example.com,"USS White
35 | FPO AE 91058"
36 | 18,Regina Ross,regina.ross@example.com,"91857 Wendy Place
37 | East Charlesshire, CA 43705"
38 | 19,Mrs. Denise May DDS,mrs..denise.may.dds@example.com,"64590 Kathleen Cove Apt. 736
39 | Derrickton, AK 05935"
40 | 20,Lisa Boyle,lisa.boyle@example.com,"USNS Russell
41 | FPO AE 51528"
42 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/function-calling-101-ecommerce/orders.csv:
--------------------------------------------------------------------------------
 1 | order_id,product_id,customer_id,order_date
 2 | 1,13,18,2024-02-15 15:15
 3 | 2,19,6,2024-01-03 17:43
 4 | 3,12,20,2024-03-11 1:13
 5 | 4,7,20,2024-02-04 12:04
 6 | 5,14,3,2024-05-02 17:12
 7 | 6,17,6,2024-02-12 1:46
 8 | 7,20,4,2024-02-26 2:59
 9 | 8,4,7,2024-05-02 16:51
10 | 9,11,2,2024-01-04 11:09
11 | 10,6,9,2024-04-09 15:04
12 | 11,3,7,2024-02-21 21:17
13 | 12,6,18,2024-02-21 18:50
14 | 13,17,11,2024-05-02 16:20
15 | 14,11,15,2024-04-20 2:49
16 | 15,16,7,2024-01-18 1:12
17 | 16,16,16,2024-05-03 11:20
18 | 17,14,18,2024-03-26 22:51
19 | 18,20,16,2024-05-07 23:25
20 | 19,1,12,2024-05-20 12:41
21 | 20,20,3,2024-01-17 7:25


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/function-calling-101-ecommerce/products.csv:
--------------------------------------------------------------------------------
 1 | product_id,name,description,price,stock_quantity
 2 | 1,Laptop,High performance laptop with 16GB RAM and 512GB SSD.,753.03,15
 3 | 2,Smartphone,Latest model smartphone with a stunning display and great camera.,398.54,59
 4 | 3,Headphones,Noise-cancelling over-ear headphones with long battery life.,889.79,97
 5 | 4,Monitor,24-inch 1080p monitor with vibrant colors and wide viewing angles.,604.44,98
 6 | 5,Keyboard,Mechanical keyboard with customizable RGB lighting.,500.24,52
 7 | 6,Mouse,Wireless mouse with ergonomic design and long battery life.,321.98,57
 8 | 7,Printer,All-in-one printer with wireless connectivity and high-quality printing.,695.29,32
 9 | 8,Tablet,Portable tablet with 10-inch display and powerful processor.,625.75,28
10 | 9,Smartwatch,Stylish smartwatch with fitness tracking and notifications.,952.72,42
11 | 10,Camera,Digital camera with 20MP sensor and 4K video recording.,247.93,99
12 | 11,Speaker,Bluetooth speaker with excellent sound quality and deep bass.,896.4,32
13 | 12,Router,Wi-Fi router with high speed and wide coverage.,976.16,59
14 | 13,External Hard Drive,1TB external hard drive with fast data transfer speeds.,434.46,18
15 | 14,USB Flash Drive,64GB USB flash drive with compact design and reliable storage.,991.09,77
16 | 15,Microphone,Professional microphone with clear sound and adjustable settings.,276.23,30
17 | 16,Webcam,HD webcam with wide-angle lens and built-in microphone.,890.39,13
18 | 17,Drone,Compact drone with HD camera and stable flight controls.,285.93,37
19 | 18,Projector,Portable projector with bright display and multiple connectivity options.,290.22,31
20 | 19,Fitness Tracker,Fitness tracker with heart rate monitor and sleep tracking.,953.65,4
21 | 20,E-Reader,Lightweight e-reader with high-resolution display and long battery life.,132.15,62
22 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/data/employees.csv:
--------------------------------------------------------------------------------
1 | employee_id,name,email
2 | 1,Richard Hendricks,richard@piedpiper.com
3 | 2,Erlich Bachman,erlich@aviato.com
4 | 3,Dinesh Chugtai,dinesh@piedpiper.com
5 | 4,Bertram Gilfoyle,gilfoyle@piedpiper.com
6 | 5,Jared Dunn,jared@piedpiper.com
7 | 6,Monica Hall,monica@raviga.com
8 | 7,Gavin Belson,gavin@hooli.com


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/data/purchases.csv:
--------------------------------------------------------------------------------
1 | purchase_id,purchase_date,product_name,employee_id,amount
2 | 1,'2024-02-01',iPhone,1,750
3 | 2,'2024-02-02',Tesla,2,70000
4 | 3,'2024-02-03',Humane pin,3,500
5 | 4,'2024-02-04',iPhone,4,700
6 | 5,'2024-02-05',Tesla,5,75000


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/verified-queries/employees-without-purchases.yaml:
--------------------------------------------------------------------------------
1 | description: Employees without a purchase since Feb 1, 2024
2 | sql: |
3 |   SELECT employees.name as employees_without_purchases
4 |   FROM employees.csv AS employees
5 |   LEFT JOIN purchases.csv AS purchases ON employees.employee_id = purchases.employee_id
6 |   AND purchases.purchase_date > '2024-02-01'
7 |   WHERE purchases.purchase_id IS NULL
8 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/verified-queries/most-expensive-purchase.yaml:
--------------------------------------------------------------------------------
 1 | description: Employee with the most expensive purchase
 2 | sql: |
 3 |   SELECT employees.name AS employee_name,
 4 |         MAX(amount) AS max_purchase_amount
 5 |   FROM purchases.csv AS purchases
 6 |   JOIN employees.csv AS employees ON purchases.employee_id = employees.employee_id
 7 |   GROUP BY employees.name
 8 |   ORDER BY max_purchase_amount DESC
 9 |   LIMIT 1
10 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/verified-queries/most-recent-purchases.yaml:
--------------------------------------------------------------------------------
 1 | description: Five most recent purchases
 2 | sql: |
 3 |   SELECT 
 4 |          purchases.purchase_date,
 5 |          purchases.product_name,
 6 |          purchases.amount,
 7 |          employees.name
 8 |   FROM purchases.csv AS purchases
 9 |   JOIN employees.csv AS employees ON purchases.employee_id = employees.employee_id
10 |   ORDER BY purchases.purchase_date DESC
11 |   LIMIT 5;
12 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/json-mode-function-calling-for-sql/verified-queries/number-of-teslas.yaml:
--------------------------------------------------------------------------------
1 | description: Number of Teslas purchased
2 | sql: |
3 |   SELECT COUNT(*) as number_of_teslas
4 |   FROM purchases.csv AS p
5 |   JOIN employees.csv AS e ON e.employee_id = p.employee_id
6 |   WHERE p.product_name = 'Tesla'
7 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-api-cookbook/parallel-tool-use/requirements.txt:
--------------------------------------------------------------------------------
1 | groq
2 | python-dotenv
3 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/conversational-chatbot-langchain/README.md:
--------------------------------------------------------------------------------
 1 | # Groq LangChain Conversational Chatbot
 2 | 
 3 | A simple application that allows users to interact with a conversational chatbot powered by LangChain. The application uses the Groq API to generate responses and leverages LangChain's [ConversationBufferWindowMemory](https://python.langchain.com/v0.1/docs/modules/memory/types/buffer_window/) to maintain a history of the conversation to provide context for the chatbot's responses.
 4 | 
 5 | ## Features
 6 | 
 7 | - **Conversational Interface**: The application provides a conversational interface where users can ask questions or make statements, and the chatbot responds accordingly.
 8 | 
 9 | - **Contextual Responses**: The application maintains a history of the conversation, which is used to provide context for the chatbot's responses.
10 | 
11 | - **LangChain Integration**: The chatbot is powered by the LangChain API, which uses advanced natural language processing techniques to generate human-like responses.
12 | 
13 | ## Usage
14 | 
15 | <!-- markdown-link-check-disable -->
16 | 
17 | You will need to store a valid Groq API Key as a secret to proceed with this example. You can generate one for free [here](https://console.groq.com/keys).
18 | 
19 | <!-- markdown-link-check-enable -->
20 | 
21 | You can [fork and run this application on Replit](https://replit.com/@GroqCloud/Chatbot-with-Conversational-Memory-on-LangChain) or run it on the command line with `python main.py`
22 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/conversational-chatbot-langchain/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/groq/groq-example-templates/conversational-chatbot-langchain/requirements.txt


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/crewai-agents/README.md:
--------------------------------------------------------------------------------
 1 | # CrewAI Machine Learning Assistant
 2 | 
 3 | ## Overview
 4 | 
 5 | The [CrewAI](https://docs.crewai.com/) Machine Learning Assistant is a command line application designed to kickstart your machine learning projects. It leverages a team of AI agents to guide you through the initial steps of defining, assessing, and solving machine learning problems.
 6 | 
 7 | ## Features
 8 | 
 9 | - **Agents**: Utilizes specialized agents to perform tasks such as problem definition, data assessment, model recommendation, and code generation, enhancing the workflow and efficiency of machine learning projects.
10 | 
11 | - **CrewAI Framework**: Integrates multiple agents into a cohesive framework, enabling seamless interaction and task execution to streamline the machine learning process.
12 | 
13 | - **LangChain Integration**: Incorporates LangChain to facilitate natural language processing and enhance the interaction between the user and the machine learning assistant.
14 | 
15 | ## Usage
16 | 
17 | <!-- markdown-link-check-disable -->
18 | 
19 | You will need to store a valid Groq API Key as a secret to proceed with this example. You can generate one for free [here](https://console.groq.com/keys).
20 | 
21 | <!-- markdown-link-check-enable -->
22 | 
23 | You can [fork and run this application on Replit](https://replit.com/@GroqCloud/CrewAI-Machine-Learning-Assistant) or run it on the command line with `python main.py`. You can upload a sample .csv to the same directory as `main.py` to give the application a head start on your ML problem. The application will output a Markdown file including python code for your ML use case to the same directory as main.py.
24 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/crewai-agents/requirements.txt:
--------------------------------------------------------------------------------
1 | crewai
2 | langchain_groq
3 | pandas


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/groq-quickstart-conversational-chatbot/README.md:
--------------------------------------------------------------------------------
 1 | # Groq Quickstart Conversational Chatbot
 2 | 
 3 | A simple application that allows users to interact with a conversational chatbot powered by Groq. This application is designed to get users up and running quickly with building a chatbot.
 4 | 
 5 | ## Features
 6 | 
 7 | **Conversational Interface**: Provides a simple interface where users can input text and receive responses from the chatbot.
 8 | 
 9 | **Short Responses**: The chatbot replies with very short and concise answers, keeping interactions brief and to the point.
10 | 
11 | **Groq Integration**: Utilizes the Groq API to generate responses, leveraging the power of the Llama3-70b-8192 model.
12 | 
13 | ## Usage
14 | 
15 | <!-- markdown-link-check-disable -->
16 | 
17 | You will need to store a valid Groq API Key as a secret to proceed with this example. You can generate one for free [here](https://console.groq.com/keys).
18 | 
19 | <!-- markdown-link-check-enable -->
20 | 
21 | You can [fork and run this application on Replit](https://replit.com/@GroqCloud/Groq-Quickstart-Conversational-Chatbot) or run it on the command line with `python main.py`.
22 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/groq-quickstart-conversational-chatbot/main.py:
--------------------------------------------------------------------------------
 1 | #set GROQ_API_KEY in the secrets
 2 | 
 3 | import os
 4 | from groq import Groq
 5 | 
 6 | # Create the Groq client
 7 | client = Groq(
 8 |     api_key=os.environ.get("GROQ_API_KEY")
 9 | )
10 | 
11 | # Set the system prompt
12 | system_prompt = {
13 |     "role": "system",
14 |     "content":
15 |     "You are a helpful assistant. You reply with very short answers."
16 | }
17 | 
18 | # Initialize the chat history
19 | chat_history = [system_prompt]
20 | 
21 | while True:
22 |   # Get user input from the console
23 |   user_input = input("You: ")
24 | 
25 |   # Append the user input to the chat history
26 |   chat_history.append({"role": "user", "content": user_input})
27 | 
28 |   response = client.chat.completions.create(model="llama3-70b-8192",
29 |                                             messages=chat_history,
30 |                                             max_tokens=100,
31 |                                             temperature=1.2)
32 |   # Append the response to the chat history
33 |   chat_history.append({
34 |       "role": "assistant",
35 |       "content": response.choices[0].message.content
36 |   })
37 |   # Print the response
38 |   print("Assistant:", response.choices[0].message.content)
39 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/groq-quickstart-conversational-chatbot/requirements.txt:
--------------------------------------------------------------------------------
1 | groq


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/groqing-the-stock-market-function-calling-llama3/requirements.txt:
--------------------------------------------------------------------------------
 1 | streamlit
 2 | pandas
 3 | numpy
 4 | groq
 5 | langchain_community
 6 | langchain_groq
 7 | yfinance
 8 | plotly
 9 | langchain_core
10 | nbformat>=4.2.0
11 | ipython
12 | kaleido


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/llamachat-conversational-chatbot-with-llamaIndex/README.md:
--------------------------------------------------------------------------------
 1 | # LlamaChat: Conversational Chatbot with LlamaIndex and Llama3
 2 | 
 3 | A simple application that allows users to interact with a conversational chatbot powered by the LlamaIndex framework and Meta's Llama3 model. The application uses the Groq API to generate responses and supports different modes of interaction, including simple chat, streaming chat, and customizable chat with system prompts.
 4 | 
 5 | ##Features
 6 | 
 7 | **LlamaIndex**: The application uses LlamaIndex to manage and generate responses, leveraging the power of Groq's language model.
 8 | 
 9 | **Simple Chat**: Generates responses based on user input using the Groq API with LlamaIndex.
10 | 
11 | **Streaming Chat**: Provides real-time streaming responses for user input.
12 | 
13 | **Customizable Chat**: Allows for chat customization by setting a system prompt to guide the chatbot's responses.
14 | 
15 | ##Usage
16 | 
17 | <!-- markdown-link-check-disable -->
18 | 
19 | You will need to store a valid Groq API Key as a secret to proceed with this example. You can generate one for free [here](https://console.groq.com/keys).
20 | 
21 | <!-- markdown-link-check-enable -->
22 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/llamachat-conversational-chatbot-with-llamaIndex/main.py:
--------------------------------------------------------------------------------
 1 | from llama_index.llms.groq import Groq
 2 | from llama_index.core.llms import ChatMessage
 3 | 
 4 | llm = Groq(model="llama3-8b-8192")
 5 | 
 6 | 
 7 | system_prompt = 'You are a friendly but highly sarcastic chatbot assistant'
 8 | 
 9 | while True:
10 |     # Get the user's question
11 |     user_input = input("User: ")
12 | 
13 |     #user_input = 'write a few paragraphs explaining generative AI to a college freshman'
14 | 
15 |     ##################################
16 |     # Simple Chat
17 |     ##################################
18 |     print('Simple Chat:\n\n')
19 |     response = llm.complete(user_input)
20 |     print(response)
21 | 
22 | 
23 |     ##################################
24 |     # Streaming Chat
25 |     ##################################
26 |     stream_response = llm.stream_complete(
27 |         user_input
28 |     )
29 |     print('\n\nStreaming Chat:\n')
30 |     for t in stream_response:
31 |         print(t.delta, end="")
32 | 
33 | 
34 |     ##################################
35 |     # Customizable Chat
36 |     ##################################
37 |     messages = [
38 |         ChatMessage(role="system", content=system_prompt),
39 |         ChatMessage(role="user", content=user_input),
40 |     ]
41 |     print('\n\nChat with System Prompt:\n')
42 |     response_with_system_prompt = llm.chat(messages)
43 | 
44 |     print(response_with_system_prompt)
45 | 
46 | 
47 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/llamachat-conversational-chatbot-with-llamaIndex/requirements.txt:
--------------------------------------------------------------------------------
1 | llama_index
2 | llama-index-llms-groq


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/presidential-speeches-rag-with-pinecone/requirements.txt:
--------------------------------------------------------------------------------
1 | pandas
2 | numpy
3 | groq
4 | langchain_community
5 | langchain_pinecone
6 | transformers
7 | scikit-learn
8 | sentence-transformers


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/text-to-sql-json-mode/data/employees.csv:
--------------------------------------------------------------------------------
1 | employee_id,name,email
2 | 1,Richard Hendricks,richard@piedpiper.com
3 | 2,Erlich Bachman,erlich@aviato.com
4 | 3,Dinesh Chugtai,dinesh@piedpiper.com
5 | 4,Bertram Gilfoyle,gilfoyle@piedpiper.com
6 | 5,Jared Dunn,jared@piedpiper.com
7 | 6,Monica Hall,monica@raviga.com
8 | 7,Gavin Belson,gavin@hooli.com


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/text-to-sql-json-mode/data/purchases.csv:
--------------------------------------------------------------------------------
1 | purchase_id,purchase_date,product_name,employee_id,amount
2 | 1,'2024-02-01',iPhone,1,750
3 | 2,'2024-02-02',Tesla,2,70000
4 | 3,'2024-02-03',Humane pin,3,500
5 | 4,'2024-02-04',iPhone,4,700
6 | 5,'2024-02-05',Tesla,5,75000


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/text-to-sql-json-mode/requirements.txt:
--------------------------------------------------------------------------------
1 | duckdb
2 | groq
3 | sqlparse
4 | pandas
5 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/data/employees.csv:
--------------------------------------------------------------------------------
1 | employee_id,name,email
2 | 1,Richard Hendricks,richard@piedpiper.com
3 | 2,Erlich Bachman,erlich@aviato.com
4 | 3,Dinesh Chugtai,dinesh@piedpiper.com
5 | 4,Bertram Gilfoyle,gilfoyle@piedpiper.com
6 | 5,Jared Dunn,jared@piedpiper.com
7 | 6,Monica Hall,monica@raviga.com
8 | 7,Gavin Belson,gavin@hooli.com


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/data/purchases.csv:
--------------------------------------------------------------------------------
1 | purchase_id,purchase_date,product_name,employee_id,amount
2 | 1,'2024-02-01',iPhone,1,750
3 | 2,'2024-02-02',Tesla,2,70000
4 | 3,'2024-02-03',Humane pin,3,500
5 | 4,'2024-02-04',iPhone,4,700
6 | 5,'2024-02-05',Tesla,5,75000


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/requirements.txt:
--------------------------------------------------------------------------------
1 | groq
2 | sentence-transformers
3 | langchain_community
4 | scikit-learn
5 | numpy
6 | duckdb
7 | pyyaml
8 | sqlparse
9 | tabulate


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/verified-queries/employees-without-purchases.yaml:
--------------------------------------------------------------------------------
1 | description: Employees without a purchase since Feb 1, 2024
2 | sql: |
3 |   SELECT employees.name as employees_without_purchases
4 |   FROM employees.csv AS employees
5 |   LEFT JOIN purchases.csv AS purchases ON employees.employee_id = purchases.employee_id
6 |   AND purchases.purchase_date > '2024-02-01'
7 |   WHERE purchases.purchase_id IS NULL
8 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/verified-queries/most-expensive-purchase.yaml:
--------------------------------------------------------------------------------
 1 | description: Employee with the most expensive purchase
 2 | sql: |
 3 |   SELECT employees.name AS employee_name,
 4 |         MAX(amount) AS max_purchase_amount
 5 |   FROM purchases.csv AS purchases
 6 |   JOIN employees.csv AS employees ON purchases.employee_id = employees.employee_id
 7 |   GROUP BY employees.name
 8 |   ORDER BY max_purchase_amount DESC
 9 |   LIMIT 1
10 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/verified-queries/most-recent-purchases.yaml:
--------------------------------------------------------------------------------
 1 | description: Five most recent purchases
 2 | sql: |
 3 |   SELECT purchases.product_name,
 4 |          purchases.amount,
 5 |          employees.name
 6 |   FROM purchases.csv AS purchases
 7 |   JOIN employees.csv AS employees ON purchases.employee_id = employees.employee_id
 8 |   ORDER BY purchases.purchase_date DESC
 9 |   LIMIT 5;
10 | 


--------------------------------------------------------------------------------
/3p-integrations/groq/groq-example-templates/verified-sql-function-calling/verified-queries/number-of-teslas.yaml:
--------------------------------------------------------------------------------
1 | description: Number of Teslas purchased
2 | sql: |
3 |   SELECT COUNT(*) as number_of_teslas
4 |   FROM purchases.csv AS p
5 |   JOIN employees.csv AS e ON e.employee_id = p.employee_id
6 |   WHERE p.product_name = 'Tesla'
7 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/README.md:
--------------------------------------------------------------------------------
 1 | # Tune Llama 3 for text-to-SQL and improve accuracy from 30% to 95%
 2 | 
 3 | This repo and notebook `meta_lamini.ipynb` demonstrate how to tune Llama 3 to generate valid SQL queries and improve accuracy from 30% to 95%.
 4 | 
 5 | In this notebook we'll be using Lamini, and more specifically, Lamini Memory Tuning.
 6 | 
 7 | Lamini is an integrated platform for LLM inference and tuning for the enterprise. Lamini Memory Tuning is a new tool you can use to embed facts into LLMs that improves factual accuracy and reduces hallucinations. Inspired by information retrieval, this method has set a new standard of accuracy for LLMs with less developer effort.
 8 | 
 9 | Learn more about Lamini Memory Tuning: https://www.lamini.ai/blog/lamini-memory-tuning
10 | 
11 | Please head over to https://app.lamini.ai/account to get your free api key.
12 | 
13 | You can authenticate by writing the following to a file `~/.lamini/configure.yaml`
14 | 
15 | ```
16 | production:
17 |     key: <YOUR-LAMINI-API-KEY>
18 | ```
19 | 
20 | This tuning tutorial uses the `nba_roster` sqlite database to tune a Llama 3 model.
21 | 
22 | ## Additional resources
23 | 
24 | ▫️ Fortune 500 case study: http://www.lamini.ai/blog/llm-text-to-sql <br>
25 | ▫️ Technical paper: https://github.com/lamini-ai/Lamini-Memory-Tuning/blob/main/research-paper.pdf <br>
26 | ▫️ Model weights: https://huggingface.co/engineering-lamini/lamini-1-random
27 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/assets/manual_filtering.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/lamini/text2sql_memory_tuning/assets/manual_filtering.png


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/assets/website.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/lamini/text2sql_memory_tuning/assets/website.png


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/nba_roster.db:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/lamini/text2sql_memory_tuning/nba_roster.db


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/get_default_finetune_args.py:
--------------------------------------------------------------------------------
1 | def get_default_finetune_args():
2 |     return {
3 |         "learning_rate": 0.0003,
4 |         "max_steps": 60,
5 |         "early_stopping": False,
6 |         "load_best_model_at_end": False,
7 |         "peft_args": {"r_value": 32},
8 |     }
9 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/get_rubric.py:
--------------------------------------------------------------------------------
 1 | def get_rubric():
 2 |     prompt = (
 3 |         "Read this scoring rubric carefully and follow the instructions precisely:\n"
 4 |     )
 5 |     prompt += (
 6 |         "A score of 5 means that model's value is the same as the gold answer's id.\n"
 7 |     )
 8 |     prompt += "A score of 4 means that the model's answer is the same or a paraphrase of the gold answer, but the value may not be an exact match.\n"
 9 |     prompt += "A score of 3 means that the model's answer is similar as the gold answer's description, but the value may be wrong. Both answers may indicate that revenue is increased but the gold says 12 percent and the model say 50 million USD.\n"
10 |     prompt += "A score of 2 means that the model's answer is not similar to the gold answer, but the answer is plausible.\n"
11 |     prompt += "A score of 1 means that the model's answer is not similar to the gold answer, and the answer doesn't make sense.\n"
12 | 
13 |     prompt += "Assign a 5 for a correct value even if other fields are missing.\n"
14 | 
15 |     return prompt
16 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/get_schema.py:
--------------------------------------------------------------------------------
 1 | def get_schema():
 2 |     return """\
 3 | 0|Team|TEXT eg. "Toronto Raptors"
 4 | 1|NAME|TEXT eg. "Otto Porter Jr."
 5 | 2|Jersey|TEXT eg. "0" and when null has a value "NA"
 6 | 3|POS|TEXT eg. "PF"
 7 | 4|AGE|INT eg. "22" in years
 8 | 5|HT|TEXT eg. `6' 7"` or `6' 10"`
 9 | 6|WT|TEXT eg. "232 lbs" 
10 | 7|COLLEGE|TEXT eg. "Michigan" and when null has a value "--"
11 | 8|SALARY|TEXT eg. "$9,945,830" and when null has a value "--"
12 | """
13 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/load_dataset.py:
--------------------------------------------------------------------------------
 1 | import jsonlines
 2 | 
 3 | from util.make_llama_3_prompt import make_llama_3_prompt
 4 | 
 5 | 
 6 | def load_training_data(args, make_question):
 7 |     path = f"data/training_data/{args.training_file_name}"
 8 | 
 9 |     limit = 1000
10 | 
11 |     with jsonlines.open(path) as reader:
12 |         for index, obj in enumerate(reversed(list(reader))):
13 |             if index >= limit:
14 |                 break
15 | 
16 |             yield {
17 |                 "input": make_llama_3_prompt(**make_question(obj)),
18 |                 "output": obj["sql"] + "<|eot_id|>",
19 |             }
20 | 
21 | 
22 | def get_dataset(args, make_question):
23 |     dataset = list(load_training_data(args, make_question))
24 |     return dataset
25 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/make_llama_3_prompt.py:
--------------------------------------------------------------------------------
1 | def make_llama_3_prompt(user, system=""):
2 |     system_prompt = ""
3 |     if system != "":
4 |         system_prompt = (
5 |             f"<|start_header_id|>system<|end_header_id|>\n\n{system}<|eot_id|>"
6 |         )
7 |     return f"<|begin_of_text|>{system_prompt}<|start_header_id|>user<|end_header_id|>\n\n{user}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n"
8 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/parse_arguments.py:
--------------------------------------------------------------------------------
 1 | from argparse import ArgumentParser
 2 | 
 3 | 
 4 | def parse_arguments():
 5 |     parser = ArgumentParser()
 6 | 
 7 |     # The max number of examples to evaluate
 8 |     parser.add_argument(
 9 |         "--max-examples",
10 |         type=int,
11 |         default=100,
12 |         help="The max number of examples to evaluate",
13 |         required=False,
14 |     )
15 | 
16 |     parser.add_argument(
17 |         "--sql-model-name",
18 |         type=str,
19 |         default="meta-llama/Meta-Llama-3.1-8B-Instruct",
20 |         help="The model to use for text2sql",
21 |         required=False,
22 |     )
23 | 
24 |     parser.add_argument(
25 |         "--gold-file-name",
26 |         type=str,
27 |         default="gold-test-set.jsonl",
28 |         help="The gold dataset to use as seed",
29 |         required=False,
30 |     )
31 | 
32 |     parser.add_argument(
33 |         "--training-file-name",
34 |         type=str,
35 |         default="generated_queries.jsonl",
36 |         help="The training dataset",
37 |         required=False,
38 |     )
39 | 
40 |     return parser.parse_args()
41 | 


--------------------------------------------------------------------------------
/3p-integrations/lamini/text2sql_memory_tuning/util/setup_logging.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | 
 3 | 
 4 | def setup_logging():
 5 |     # Remove all handlers associated with the root logger object.
 6 |     for handler in logging.root.handlers[:]:
 7 |         logging.root.removeHandler(handler)
 8 | 
 9 |     logging.basicConfig(
10 |         level=logging.WARNING,
11 |         format="%(asctime)s [%(levelname)s] %(message)s",
12 |         handlers=[logging.StreamHandler()],
13 |     )
14 | 


--------------------------------------------------------------------------------
/3p-integrations/llamaindex/dlai_agentic_rag/README.md:
--------------------------------------------------------------------------------
 1 | # Building Agentic RAG with Llamaindex
 2 | 
 3 | The folder here contains the Llama 3 ported notebooks of the DLAI short course [Building Agentic RAG with Llamaindex](https://www.deeplearning.ai/short-courses/building-agentic-rag-with-llamaindex/).
 4 | 
 5 | 1. [Building Agentic RAG with Llamaindex L1 Router Engine](../../../end-to-end-use-cases/agents/DeepLearningai_Course_Notebooks/AI_Agents_in_LangGraph_L1_Build_an_Agent_from_Scratch.ipynb) shows how to implement a simple agentic RAG, a router that will pick up one of several query tools (question answering or summarization) to execute a query on a single document. Note this notebook is located in the `quickstart` folder.
 6 | 
 7 | 2. [Building Agentic RAG with Llamaindex L2 Tool Calling](Building_Agentic_RAG_with_Llamaindex_L2_Tool_Calling.ipynb) shows how to use Llama 3 to not only pick a function to execute, but also infer an argument to pass through the function.
 8 | 
 9 | 3. [Building Agentic RAG with Llamaindex L3 Building an Agent Reasoning Loop](Building_Agentic_RAG_with_Llamaindex_L3_Building_an_Agent_Reasoning_Loop.ipynb) shows how to define a complete agent reasoning loop to reason over tools and multiple steps on a complex question the user asks about a single document while maintaining memory.
10 | 
11 | 3. [Building Agentic RAG with Llamaindex L4 Building a Multi-Document Agent](Building_Agentic_RAG_with_Llamaindex_L4_Building_a_Multi-Document_Agent.ipynb) shows how to use an agent to handle multiple documents and increasing degrees of complexity.
12 | 


--------------------------------------------------------------------------------
/3p-integrations/modal/many-llamas-human-eval/run_e2e.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | set -euo pipefail
 3 | IFS=$'\n\t'
 4 | 
 5 | command -v modal >/dev/null 2>&1 || { echo >&2 "modal command not found. Install modal first! Aborting."; exit 1; }
 6 | 
 7 | echo 'downloading LLaMA 3.2 3B Instruct model'
 8 | echo 'make sure to create a Secret called huggingface on Modal and accept the LLaMA 3.2 license'
 9 | modal run download.py
10 | 
11 | echo 'deploying vLLM inference server'
12 | modal deploy inference.py
13 | 
14 | echo 'running HumanEval generation'
15 | modal run generate.py --data-dir test --no-dry-run --n 1000 --subsample 100
16 | 
17 | echo 'running HumanEval evaluation'
18 | modal run eval.py
19 | 
20 | echo 'generating graphs for pass@k and fail@k'
21 | modal run plot.py


--------------------------------------------------------------------------------
/3p-integrations/tgi/merge_lora_weights.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import fire
 5 | import torch
 6 | from peft import PeftModel
 7 | from transformers import LlamaForCausalLM, LlamaTokenizer
 8 | 
 9 | 
10 | def main(base_model: str,
11 |          peft_model: str,
12 |          output_dir: str):
13 |         
14 |     model = LlamaForCausalLM.from_pretrained(
15 |         base_model,
16 |         load_in_8bit=False,
17 |         torch_dtype=torch.float16,
18 |         device_map="auto",
19 |         offload_folder="tmp", 
20 |     )
21 |     
22 |     tokenizer = LlamaTokenizer.from_pretrained(
23 |         base_model
24 |     )
25 |         
26 |     model = PeftModel.from_pretrained(
27 |         model, 
28 |         peft_model, 
29 |         torch_dtype=torch.float16,
30 |         device_map="auto",
31 |         offload_folder="tmp",
32 |     )
33 | 
34 |     model = model.merge_and_unload()
35 |     model.save_pretrained(output_dir)
36 |     tokenizer.save_pretrained(output_dir)
37 | 
38 | 
39 | if __name__ == "__main__":
40 |     fire.Fire(main)


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/BERTScore.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/BERTScore.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/CoQA.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/CoQA.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/ColPaliMaxSim-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/ColPaliMaxSim-1.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/Nvidia_collage.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/Nvidia_collage.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/UMAP.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/UMAP.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/cRAG.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/cRAG.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/cRAG_indexing.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/cRAG_indexing.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/cRAG_querytime.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/cRAG_querytime.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/cluster.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/cluster.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/colpali_arch.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/colpali_arch.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/conversation.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/conversation.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/deploy_CFT.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/deploy_CFT.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/ft_model.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/ft_model.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/mmrag_only.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/mmrag_only.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/page_25.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/page_25.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/repetition_task.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/repetition_task.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/reranking.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/reranking.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/semantic_search.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/semantic_search.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/simple_RAG.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/simple_RAG.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/structured_text_image.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/structured_text_image.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/summarization.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/summarization.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/summary_task.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/summary_task.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/text_RAG.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/text_RAG.png


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/together-color.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/together-color.jpg


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/together.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/together.gif


--------------------------------------------------------------------------------
/3p-integrations/togetherai/images/wandb_model.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/3p-integrations/togetherai/images/wandb_model.png


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) Meta Platforms, Inc. and affiliates
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining
 6 | a copy of this software and associated documentation files (the
 7 | "Software"), to deal in the Software without restriction, including
 8 | without limitation the rights to use, copy, modify, merge, publish,
 9 | distribute, sublicense, and/or sell copies of the Software, and to
10 | permit persons to whom the Software is furnished to do so, subject to
11 | the following conditions:
12 | 
13 | The above copyright notice and this permission notice shall be
14 | included in all copies or substantial portions of the Software.
15 | 
16 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17 | EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18 | MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19 | NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20 | LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21 | OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22 | WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


--------------------------------------------------------------------------------
/UPDATES.md:
--------------------------------------------------------------------------------
 1 | DIFFLOG:
 2 | <!-- markdown-link-check-disable -->
 3 | Nested Folders rename:
 4 | - /recipes/3p_integrations -> /3p-integrations
 5 | - /recipes/quickstart -> /getting-started
 6 | - /recipes/responsible_ai -> /end-to-end-use-cases/responsible_ai
 7 | - /recipes/use_cases -> /end-to-end-use-cases
 8 | - /quickstart/agents -> /end-to-end-use-cases/agents 
 9 | - /quickstart/NotebookLlama -> /end-to-end-use-cases/NotebookLlama
10 | - /quickstart/responsible_ai -> /end-to-end-use-cases/responsible_ai
11 | - /recipes/use_cases/end-toend/RAFT-Chatbot -> /end-to-end-use-cases/RAFT-Chatbot
12 | - /docs -> /src/docs/
13 | - /dev_requirements.txt -> /src/dev_requirements.txt
14 | - /requirements.txt -> /src/requirements.txt
15 | - /tools -> /end-to-end-use-cases/benchmarks/ 
16 | - /recipes/experimental/long_context -> /end-to-end-use-cases/long_context
17 | 
18 | 
19 | Removed folders:
20 | - /flagged (Empty folder)
21 | - /recipes/quickstart/Running_Llama3_Anywhere (Redundant code)
22 | - /recipes/quickstart/inference/codellama (deprecated model)
23 | - /recipes/quickstart/getting-to-know-llama-3.ipynb
24 | <!-- markdown-link-check-enable -->
25 | 


--------------------------------------------------------------------------------
/dev_requirements.txt:
--------------------------------------------------------------------------------
1 | vllm
2 | pytest-mock
3 | auditnlg


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/.gitignore:
--------------------------------------------------------------------------------
 1 | # Gradle files
 2 | .gradle/
 3 | build/
 4 | 
 5 | # Local configuration file (sdk path, etc)
 6 | local.properties
 7 | 
 8 | # Log/OS Files
 9 | *.log
10 | 
11 | # Android Studio generated files and folders
12 | captures/
13 | .externalNativeBuild/
14 | .cxx/
15 | *.apk
16 | output.json
17 | 
18 | # IntelliJ
19 | *.iml
20 | .idea/
21 | misc.xml
22 | deploymentTargetDropDown.xml
23 | render.experimental.xml
24 | 
25 | # Keystore files
26 | *.jks
27 | *.keystore
28 | 
29 | # Google Services (e.g. APIs or Firebase)
30 | google-services.json
31 | 
32 | # Android Profiling
33 | *.hprof
34 | 
35 | .DS_Store
36 | 
37 | *.jar
38 | *.aar
39 | *.so
40 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/README.md:
--------------------------------------------------------------------------------
 1 | # Android Document Summarizer App
 2 | 
 3 | 
 4 | <img src="./screenshot.png">
 5 | 
 6 | This is a sample Android app to demonstrate Llama 4 multimodal and multilingual capabilities. This app allows user to take a picture/screenshot of a document, and then summarize and translate it into any of the supported languages
 7 | 
 8 | ## Quick Start
 9 | 
10 | 1. Open the DocumentSummarizer folder in Android Studio
11 | 2. Update the `API_KEY` in `AppUtils.java`
12 | 3. Build the Android Project
13 | 4. Inside the app, tap on settings icon on top right
14 | 5. Configure the Remote URL endpoint (any supported providers that serve Llama 4 models. For example: https://api.together.xyz)
15 | 6. Select the desired model from the drop down list. If you need to add more models, modify `ModelUtils.java`
16 | 7. Go back to the Main chat window
17 | 8. Press the '+' button on the bottom left and select an image document (or take a picture of one!)
18 | 9. Select the 'globe' button on the bottom left and select your languages
19 | 10. Enter a prompt like "summarize this" and press Enter!
20 | 
21 | > **_NOTE:_**  This is an example project to demonstrate E2E flow. You should NOT use/store API key directly on client. Exposing your API key in client-side environments allows malicious users to take that key and make requests on your behalf. Requests should always be routed through your own backend server where you can keep your API key secure.
22 | 
23 | 
24 | ## Reporting Issues
25 | If you encountered any bugs or issues following this tutorial please file a bug/issue here on [Github](https://github.com/meta-llama/llama-cookbook/issues)).
26 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/.gitignore:
--------------------------------------------------------------------------------
1 | /build
2 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/proguard-rules.pro:
--------------------------------------------------------------------------------
 1 | # Add project specific ProGuard rules here.
 2 | # You can control the set of applied configuration files using the
 3 | # proguardFiles setting in build.gradle.
 4 | #
 5 | # For more details, see
 6 | #   http://developer.android.com/guide/developing/tools/proguard.html
 7 | 
 8 | # If your project uses WebView with JS, uncomment the following
 9 | # and specify the fully qualified class name to the JavaScript interface
10 | # class:
11 | #-keepclassmembers class fqcn.of.javascript.interface.for.webview {
12 | #   public *;
13 | #}
14 | 
15 | # Uncomment this to preserve the line number information for
16 | # debugging stack traces.
17 | #-keepattributes SourceFile,LineNumberTable
18 | 
19 | # If you keep the line number information, uncomment this to
20 | # hide the original source file name.
21 | #-renamesourcefileattribute SourceFile


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/AppLog.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | import java.text.SimpleDateFormat;
12 | import java.util.Date;
13 | import java.util.Locale;
14 | 
15 | public class AppLog {
16 |   private final Long timestamp;
17 |   private final String message;
18 | 
19 |   public AppLog(String message) {
20 |     this.timestamp = getCurrentTimeStamp();
21 |     this.message = message;
22 |   }
23 | 
24 |   public Long getTimestamp() {
25 |     return timestamp;
26 |   }
27 | 
28 |   public String getMessage() {
29 |     return message;
30 |   }
31 | 
32 |   public String getFormattedLog() {
33 |     return "[" + getFormattedTimeStamp() + "] " + message;
34 |   }
35 | 
36 |   private Long getCurrentTimeStamp() {
37 |     return System.currentTimeMillis();
38 |   }
39 | 
40 |   private String getFormattedTimeStamp() {
41 |     return formatDate(timestamp);
42 |   }
43 | 
44 |   private String formatDate(long milliseconds) {
45 |     SimpleDateFormat formatter = new SimpleDateFormat("yyyy-MM-dd  HH:mm:ss", Locale.getDefault());
46 |     Date date = new Date(milliseconds);
47 |     return formatter.format(date);
48 |   }
49 | }
50 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/AppLogging.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | import android.app.Application;
12 | import android.util.Log;
13 | import java.util.ArrayList;
14 | 
15 | public class AppLogging extends Application {
16 |   private static AppLogging singleton;
17 | 
18 |   private ArrayList<AppLog> logs;
19 |   private DemoSharedPreferences mDemoSharedPreferences;
20 | 
21 |   @Override
22 |   public void onCreate() {
23 |     super.onCreate();
24 |     singleton = this;
25 |     mDemoSharedPreferences = new DemoSharedPreferences(this.getApplicationContext());
26 |     logs = mDemoSharedPreferences.getSavedLogs();
27 |     if (logs == null) { // We don't have existing sharedPreference stored
28 |       logs = new ArrayList<>();
29 |     }
30 |   }
31 | 
32 |   public static AppLogging getInstance() {
33 |     return singleton;
34 |   }
35 | 
36 |   public void log(String message) {
37 |     AppLog appLog = new AppLog(message);
38 |     logs.add(appLog);
39 |     Log.d("AppLogging", appLog.getMessage());
40 |   }
41 | 
42 |   public ArrayList<AppLog> getLogs() {
43 |     return logs;
44 |   }
45 | 
46 |   public void clearLogs() {
47 |     logs.clear();
48 |     mDemoSharedPreferences.removeExistingLogs();
49 |   }
50 | 
51 |   public void saveLogs() {
52 |     mDemoSharedPreferences.saveLogs();
53 |   }
54 | }
55 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/AppUtils.java:
--------------------------------------------------------------------------------
 1 | package com.example.llamaandroiddemo;
 2 | 
 3 | public class AppUtils {
 4 | 	// Generation Mode
 5 | 	public static final int CONVERSATION_HISTORY_MESSAGE_LOOKBACK = 1;
 6 | 
 7 | 	// Note: This is an example project to demonstrate E2E flow.
 8 | 	// You should NOT use/store API key directly on client
 9 | 	// Exposing your API key in client-side environments allows malicious users to take
10 | 	// that key and make requests on your behalf. Requests should always be routed through
11 | 	// your own backend server where you can keep your API key secure.
12 | 	public static final String API_KEY = "";
13 | }
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/HomescreenActivity.kt:
--------------------------------------------------------------------------------
 1 | package com.example.llamaandroiddemo
 2 | 
 3 | import android.content.Intent
 4 | import androidx.appcompat.app.AppCompatActivity
 5 | import android.os.Bundle
 6 | import android.widget.Button
 7 | 
 8 | class HomescreenActivity : AppCompatActivity() {
 9 | 
10 |     private lateinit var startChatButton: Button
11 | 
12 |     override fun onCreate(savedInstanceState: Bundle?) {
13 |         super.onCreate(savedInstanceState)
14 |         setContentView(R.layout.activity_homescreen)
15 | 
16 |         // Initialize UI components
17 |         startChatButton = findViewById(R.id.btn_start_chat)
18 | 
19 |         // Set up start chat button click listener
20 |         startChatButton.setOnClickListener {
21 |             val intent = Intent(this, MainActivity::class.java)
22 |             startActivity(intent)
23 |         }
24 |     }
25 | }


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/LogsAdapter.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | import android.view.LayoutInflater;
12 | import android.view.View;
13 | import android.view.ViewGroup;
14 | import android.widget.ArrayAdapter;
15 | import android.widget.TextView;
16 | import androidx.annotation.NonNull;
17 | import java.util.Objects;
18 | 
19 | public class LogsAdapter extends ArrayAdapter<AppLog> {
20 |   public LogsAdapter(android.content.Context context, int resource) {
21 |     super(context, resource);
22 |   }
23 | 
24 |   static class ViewHolder {
25 |     private TextView logTextView;
26 |   }
27 | 
28 |   @NonNull
29 |   @Override
30 |   public View getView(int position, View convertView, @NonNull ViewGroup parent) {
31 |     ViewHolder mViewHolder = null;
32 | 
33 |     String logMessage = Objects.requireNonNull(getItem(position)).getFormattedLog();
34 | 
35 |     if (convertView == null || convertView.getTag() == null) {
36 |       mViewHolder = new ViewHolder();
37 |       convertView = LayoutInflater.from(getContext()).inflate(R.layout.logs_message, parent, false);
38 |       mViewHolder.logTextView = convertView.requireViewById(R.id.logsTextView);
39 |     } else {
40 |       mViewHolder = (ViewHolder) convertView.getTag();
41 |     }
42 |     mViewHolder.logTextView.setText(logMessage);
43 |     return convertView;
44 |   }
45 | }
46 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/MessageType.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | public enum MessageType {
12 |   TEXT,
13 |   IMAGE,
14 |   SYSTEM
15 | }
16 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/ModelType.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | public enum ModelType {
12 |   LLAMA_3,
13 |   LLAMA_3_1,
14 |   LLAMA_3_2,
15 |   LLAMA_GUARD_3,
16 | }
17 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/ModelUtils.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | import java.util.Arrays;
12 | import java.util.List;
13 | 
14 | public class ModelUtils {
15 |   public static List<String> getSupportedRemoteModels() {
16 |       // UPDATE THIS TO THE RELEVANT MODELS YOU WANT TO USE
17 |       // NOTE THAT SOME PROVIDERS MIGHT HAVE DIFFERENT MODEL NAMING FORMAT
18 |     return Arrays.asList(
19 |             "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
20 |             "meta-llama/Llama-4-Scout-17B-16E-Instruct"
21 |             );
22 |   }
23 | }
24 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/java/com/example/llamaandroiddemo/PromptFormat.java:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | package com.example.llamaandroiddemo;
10 | 
11 | public class PromptFormat {
12 |   public static final String DEFAULT_SYSTEM_PROMPT = "";
13 | 
14 | }
15 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/banner_shape.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android"
3 |     android:shape="rectangle">
4 |     <solid android:color="#16293D" />
5 | </shape>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_add_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF" android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M19,13h-6v6h-2v-6H5v-2h6V5h2v6h6v2z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_add_photo_alternate_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF" android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M19,7v2.99s-1.99,0.01 -2,0L17,7h-3s0.01,-1.99 0,-2h3L17,2h2v3h3v2h-3zM16,11L16,8h-3L13,5L5,5c-1.1,0 -2,0.9 -2,2v12c0,1.1 0.9,2 2,2h12c1.1,0 2,-0.9 2,-2v-8h-3zM5,19l3,-4 2,3 3,-4 4,5L5,19z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_article_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:autoMirrored="true" android:height="24dp" android:tint="#FFFFFF
2 | " android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
3 |       
4 |     <path android:fillColor="@android:color/white" android:pathData="M19,3L5,3c-1.1,0 -2,0.9 -2,2v14c0,1.1 0.9,2 2,2h14c1.1,0 2,-0.9 2,-2L21,5c0,-1.1 -0.9,-2 -2,-2zM14,17L7,17v-2h7v2zM17,13L7,13v-2h10v2zM17,9L7,9L7,7h10v2z"/>
5 |     
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_close_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF
2 | " android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
3 |       
4 |     <path android:fillColor="@android:color/white" android:pathData="M19,6.41L17.59,5 12,10.59 6.41,5 5,6.41 10.59,12 5,17.59 6.41,19 12,13.41 17.59,19 19,17.59 13.41,12z"/>
5 |     
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_delete_forever_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF" android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M6,19c0,1.1 0.9,2 2,2h8c1.1,0 2,-0.9 2,-2L18,7L6,7v12zM8.46,11.88l1.41,-1.41L12,12.59l2.12,-2.12 1.41,1.41L13.41,14l2.12,2.12 -1.41,1.41L12,15.41l-2.12,2.12 -1.41,-1.41L10.59,14l-2.13,-2.12zM15.5,4l-1,-1h-5l-1,1L5,4v2h14L19,4z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_language_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF" android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M11.99,2C6.47,2 2,6.48 2,12s4.47,10 9.99,10C17.52,22 22,17.52 22,12S17.52,2 11.99,2zM18.92,8h-2.95c-0.32,-1.25 -0.78,-2.45 -1.38,-3.56 1.84,0.63 3.37,1.91 4.33,3.56zM12,4.04c0.83,1.2 1.48,2.53 1.91,3.96h-3.82c0.43,-1.43 1.08,-2.76 1.91,-3.96zM4.26,14C4.1,13.36 4,12.69 4,12s0.1,-1.36 0.26,-2h3.38c-0.08,0.66 -0.14,1.32 -0.14,2 0,0.68 0.06,1.34 0.14,2L4.26,14zM5.08,16h2.95c0.32,1.25 0.78,2.45 1.38,3.56 -1.84,-0.63 -3.37,-1.9 -4.33,-3.56zM8.03,8L5.08,8c0.96,-1.66 2.49,-2.93 4.33,-3.56C8.81,5.55 8.35,6.75 8.03,8zM12,19.96c-0.83,-1.2 -1.48,-2.53 -1.91,-3.96h3.82c-0.43,1.43 -1.08,2.76 -1.91,3.96zM14.34,14L9.66,14c-0.09,-0.66 -0.16,-1.32 -0.16,-2 0,-0.68 0.07,-1.35 0.16,-2h4.68c0.09,0.65 0.16,1.32 0.16,2 0,0.68 -0.07,1.34 -0.16,2zM14.59,19.56c0.6,-1.11 1.06,-2.31 1.38,-3.56h2.95c-0.96,1.65 -2.49,2.93 -4.33,3.56zM16.36,14c0.08,-0.66 0.14,-1.32 0.14,-2 0,-0.68 -0.06,-1.34 -0.14,-2h3.38c0.16,0.64 0.26,1.31 0.26,2s-0.1,1.36 -0.26,2h-3.38z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_restart_alt_24.xml:
--------------------------------------------------------------------------------
1 | <vector android:height="24dp" android:tint="#FFFFFF"
2 |     android:viewportHeight="24" android:viewportWidth="24"
3 |     android:width="24dp" xmlns:android="http://schemas.android.com/apk/res/android">
4 |     <path android:fillColor="@android:color/white" android:pathData="M12,5V2L8,6l4,4V7c3.31,0 6,2.69 6,6c0,2.97 -2.17,5.43 -5,5.91v2.02c3.95,-0.49 7,-3.85 7,-7.93C20,8.58 16.42,5 12,5z"/>
5 |     <path android:fillColor="@android:color/white" android:pathData="M6,13c0,-1.65 0.67,-3.15 1.76,-4.24L6.34,7.34C4.9,8.79 4,10.79 4,13c0,4.08 3.05,7.44 7,7.93v-2.02C8.17,18.43 6,15.97 6,13z"/>
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_send_24.xml:
--------------------------------------------------------------------------------
1 | <vector android:autoMirrored="true" android:height="24dp"
2 |     android:tint="#FFFFFF
3 | " android:viewportHeight="24"
4 |     android:viewportWidth="24" android:width="24dp" xmlns:android="http://schemas.android.com/apk/res/android">
5 |     <path android:fillColor="@android:color/white" android:pathData="M2.01,21L23,12 2.01,3 2,10l15,2 -15,2z"/>
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/baseline_stop_24.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="24dp" android:tint="#FFFFFF
2 | " android:viewportHeight="24" android:viewportWidth="24" android:width="24dp">
3 |       
4 |     <path android:fillColor="@android:color/white" android:pathData="M6,6h12v12H6z"/>
5 |     
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/btn.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <selector xmlns:android="http://schemas.android.com/apk/res/android">
3 |     <!-- Disable background -->
4 |     <item android:state_enabled="false"
5 |         android:color="@color/btn_disabled"/>
6 |     <!-- Enabled background -->
7 |     <item android:color="@color/btn_enabled"/>
8 | </selector>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/chat_background.xml:
--------------------------------------------------------------------------------
 1 | <vector xmlns:android="http://schemas.android.com/apk/res/android"
 2 |     xmlns:aapt="http://schemas.android.com/aapt"
 3 |     android:width="412dp"
 4 |     android:height="893dp"
 5 |     android:viewportWidth="412"
 6 |     android:viewportHeight="893">
 7 |   <path
 8 |       android:pathData="M0,0h412v893h-412z">
 9 |     <aapt:attr name="android:fillColor">
10 |       <gradient 
11 |           android:startX="206"
12 |           android:startY="0"
13 |           android:endX="206"
14 |           android:endY="893"
15 |           android:type="linear">
16 |         <item android:offset="0.05" android:color="#FF16293D"/>
17 |         <item android:offset="0.9" android:color="#FF192E4D"/>
18 |       </gradient>
19 |     </aapt:attr>
20 |   </path>
21 | </vector>
22 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/custom_button_round.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android" android:shape="rectangle">
3 |     <solid android:color="#6080F0"/>
4 |     <corners android:radius="500dp"/>
5 |     <size android:width="100dp"
6 |         android:height="100dp"/>
7 | </shape>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/expand_circle_down.xml:
--------------------------------------------------------------------------------
 1 | <vector xmlns:android="http://schemas.android.com/apk/res/android"
 2 |     android:width="24dp"
 3 |     android:height="18dp"
 4 |     android:viewportWidth="15"
 5 |     android:viewportHeight="10">
 6 |   <path
 7 |       android:pathData="M15,2.373L7.5,10L0,2.373L2.375,0L7.5,5.212L12.625,0L15,2.373Z"
 8 |       android:fillColor="#F4F4F4"/>
 9 | </vector>
10 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/ic_launcher_foreground.xml:
--------------------------------------------------------------------------------
 1 | <vector xmlns:android="http://schemas.android.com/apk/res/android"
 2 |     xmlns:aapt="http://schemas.android.com/aapt"
 3 |     android:width="108dp"
 4 |     android:height="108dp"
 5 |     android:viewportWidth="108"
 6 |     android:viewportHeight="108">
 7 |     <path android:pathData="M31,63.928c0,0 6.4,-11 12.1,-13.1c7.2,-2.6 26,-1.4 26,-1.4l38.1,38.1L107,108.928l-32,-1L31,63.928z">
 8 |         <aapt:attr name="android:fillColor">
 9 |             <gradient
10 |                 android:endX="85.84757"
11 |                 android:endY="92.4963"
12 |                 android:startX="42.9492"
13 |                 android:startY="49.59793"
14 |                 android:type="linear">
15 |                 <item
16 |                     android:color="#44000000"
17 |                     android:offset="0.0" />
18 |                 <item
19 |                     android:color="#00000000"
20 |                     android:offset="1.0" />
21 |             </gradient>
22 |         </aapt:attr>
23 |     </path>
24 |     <path
25 |         android:fillColor="#FFFFFF"
26 |         android:fillType="nonZero"
27 |         android:pathData="M65.3,45.828l3.8,-6.6c0.2,-0.4 0.1,-0.9 -0.3,-1.1c-0.4,-0.2 -0.9,-0.1 -1.1,0.3l-3.9,6.7c-6.3,-2.8 -13.4,-2.8 -19.7,0l-3.9,-6.7c-0.2,-0.4 -0.7,-0.5 -1.1,-0.3C38.8,38.328 38.7,38.828 38.9,39.228l3.8,6.6C36.2,49.428 31.7,56.028 31,63.928h46C76.3,56.028 71.8,49.428 65.3,45.828zM43.4,57.328c-0.8,0 -1.5,-0.5 -1.8,-1.2c-0.3,-0.7 -0.1,-1.5 0.4,-2.1c0.5,-0.5 1.4,-0.7 2.1,-0.4c0.7,0.3 1.2,1 1.2,1.8C45.3,56.528 44.5,57.328 43.4,57.328L43.4,57.328zM64.6,57.328c-0.8,0 -1.5,-0.5 -1.8,-1.2s-0.1,-1.5 0.4,-2.1c0.5,-0.5 1.4,-0.7 2.1,-0.4c0.7,0.3 1.2,1 1.2,1.8C66.5,56.528 65.6,57.328 64.6,57.328L64.6,57.328z"
28 |         android:strokeWidth="1"
29 |         android:strokeColor="#00000000" />
30 | </vector>
31 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/input_text_shape.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android"
3 |     android:shape="rectangle">
4 |     <solid android:color="#081D2C" />
5 |     <corners android:radius="20dp"/>
6 |     <padding android:layout_marginTop="5dp" android:layout_marginBottom="5dp" android:left="10dp" android:right="10dp"/>
7 | </shape>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/outline_add_box_48.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="48dp" android:tint="#ffffff
2 | " android:viewportHeight="24" android:viewportWidth="24" android:width="48dp">
3 |       
4 |     <path android:fillColor="@android:color/white" android:pathData="M19,3L5,3c-1.11,0 -2,0.9 -2,2v14c0,1.1 0.89,2 2,2h14c1.1,0 2,-0.9 2,-2L21,5c0,-1.1 -0.9,-2 -2,-2zM19,19L5,19L5,5h14v14zM11,17h2v-4h4v-2h-4L13,7h-2v4L7,11v2h4z"/>
5 |     
6 | </vector>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/outline_camera_alt_48.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="48dp" android:tint="#000000" android:viewportHeight="24" android:viewportWidth="24" android:width="48dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M20,4h-3.17L15,2L9,2L7.17,4L4,4c-1.1,0 -2,0.9 -2,2v12c0,1.1 0.9,2 2,2h16c1.1,0 2,-0.9 2,-2L22,6c0,-1.1 -0.9,-2 -2,-2zM20,18L4,18L4,6h4.05l1.83,-2h4.24l1.83,2L20,6v12zM12,7c-2.76,0 -5,2.24 -5,5s2.24,5 5,5 5,-2.24 5,-5 -2.24,-5 -5,-5zM12,15c-1.65,0 -3,-1.35 -3,-3s1.35,-3 3,-3 3,1.35 3,3 -1.35,3 -3,3z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/outline_image_48.xml:
--------------------------------------------------------------------------------
1 | <vector xmlns:android="http://schemas.android.com/apk/res/android" android:height="48dp" android:tint="#000000" android:viewportHeight="24" android:viewportWidth="24" android:width="48dp">
2 |       
3 |     <path android:fillColor="@android:color/white" android:pathData="M19,5v14L5,19L5,5h14m0,-2L5,3c-1.1,0 -2,0.9 -2,2v14c0,1.1 0.9,2 2,2h14c1.1,0 2,-0.9 2,-2L21,5c0,-1.1 -0.9,-2 -2,-2zM14.14,11.86l-3,3.87L9,13.14 6,17h12l-3.86,-5.14z"/>
4 |     
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/prompt_shape.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android"
3 | android:shape="rectangle">
4 | <solid android:color="#081D2C" />
5 | <corners android:radius="4dp" />
6 | </shape>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/received_message.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android"
3 |     android:shape="rectangle">
4 |     <solid android:color="#081D2C" />
5 |     <corners android:radius="10dp" />
6 | </shape>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/sent_message.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <shape xmlns:android="http://schemas.android.com/apk/res/android"
3 |     android:shape="rectangle">
4 |     <solid android:color="@color/colorPrimary" />
5 |     <corners android:radius="10dp" />
6 | </shape>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/summarizer.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/summarizer.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/drawable/three_dots.xml:
--------------------------------------------------------------------------------
1 | <vector android:height="24dp" android:tint="#000000"
2 |     android:viewportHeight="24" android:viewportWidth="24"
3 |     android:width="24dp" xmlns:android="http://schemas.android.com/apk/res/android">
4 |     <path android:fillColor="@android:color/white" android:pathData="M6,10c-1.1,0 -2,0.9 -2,2s0.9,2 2,2 2,-0.9 2,-2 -0.9,-2 -2,-2zM18,10c-1.1,0 -2,0.9 -2,2s0.9,2 2,2 2,-0.9 2,-2 -0.9,-2 -2,-2zM12,10c-1.1,0 -2,0.9 -2,2s0.9,2 2,2 2,-0.9 2,-2 -0.9,-2 -2,-2z"/>
5 | </vector>
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/layout/activity_benchmarking.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <LinearLayout xmlns:android="http://schemas.android.com/apk/res/android"
 3 |     xmlns:tools="http://schemas.android.com/tools"
 4 |     android:layout_width="match_parent"
 5 |     android:layout_height="match_parent"
 6 |     android:orientation="vertical"
 7 |     android:clipToPadding="false"
 8 |     android:focusableInTouchMode="true"
 9 |     tools:context=".LlmBenchmarkRunner">
10 | 
11 |     <TextView
12 |         android:layout_width="match_parent"
13 |         android:layout_height="match_parent"
14 |         android:id="@+id/log_view" />
15 | 
16 | </LinearLayout>
17 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/layout/logs_message.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <LinearLayout xmlns:android="http://schemas.android.com/apk/res/android"
 3 |     xmlns:app="http://schemas.android.com/apk/res-auto"
 4 |     xmlns:tools="http://schemas.android.com/tools"
 5 |     android:layout_width="match_parent"
 6 |     android:layout_height="wrap_content"
 7 |     android:layout_marginTop="10dp">
 8 | 
 9 |         <TextView
10 |             android:id="@+id/logsTextView"
11 |             android:layout_width="match_parent"
12 |             android:layout_height="wrap_content"
13 |             android:padding="8dp"
14 |             android:text="TextView" />
15 | 
16 | </LinearLayout>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/layout/system_message.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <RelativeLayout xmlns:android="http://schemas.android.com/apk/res/android"
 3 |     android:layout_width="match_parent"
 4 |     android:layout_height="wrap_content"
 5 |     android:paddingVertical="10dp"
 6 |     android:paddingLeft="15dp"
 7 |     android:paddingRight="60dp"
 8 |     android:clipToPadding="false">
 9 | 
10 |     <TextView
11 |         android:id="@+id/message_text"
12 |         android:layout_width="match_parent"
13 |         android:layout_height="wrap_content"
14 |         android:layout_centerHorizontal="true"
15 |         android:elevation="2dp"
16 |         android:paddingHorizontal="16dp"
17 |         android:paddingVertical="12dp"
18 |         android:text="Generated text"
19 |         android:textAlignment="center"
20 |         android:textColor="#9C9C9C"
21 |         android:textSize="15dp" />
22 | 
23 | </RelativeLayout>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
3 |     <background android:drawable="@drawable/ic_launcher_background" />
4 |     <foreground android:drawable="@drawable/ic_launcher_foreground" />
5 |     <monochrome android:drawable="@drawable/ic_launcher_foreground" />
6 | </adaptive-icon>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
3 |     <background android:drawable="@drawable/ic_launcher_background" />
4 |     <foreground android:drawable="@drawable/ic_launcher_foreground" />
5 |     <monochrome android:drawable="@drawable/ic_launcher_foreground" />
6 | </adaptive-icon>
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-hdpi/ic_launcher.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-hdpi/ic_launcher.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-mdpi/ic_launcher.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-mdpi/ic_launcher.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xhdpi/ic_launcher.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xhdpi/ic_launcher.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/values/colors.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <resources>
 3 |     <color name="colorPrimary">#4294F0</color>
 4 |     <color name="colorPrimaryDark">#3700B3</color>
 5 |     <color name="colorAccent">#03DAC5</color>
 6 |     <color name="btn_enabled">#007CBA</color>
 7 |     <color name="btn_disabled">#A2A4B6</color>
 8 |     <color name="nav_bar">#16293D</color>
 9 |     <color name="status_bar">#16293D</color>
10 | </resources>
11 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/values/strings.xml:
--------------------------------------------------------------------------------
1 | <resources>
2 |     <string name="app_name">Llama Demo</string>
3 |     <string name="demo_pref_file_key">DemoPrefFileKey</string>
4 |     <string name="saved_messages_json_key">SavedMessagesJsonKey</string>
5 |     <string name="settings_json_key">SettingsJsonKey</string>
6 |     <string name="logs_json_key">LogsJsonKey</string>
7 |     <string name="start_chat_button_text">Start Chat</string>
8 | </resources>
9 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/values/styles.xml:
--------------------------------------------------------------------------------
 1 | <resources>
 2 |     <!-- Base application theme. -->
 3 |     <style name="AppTheme" parent="Theme.AppCompat.Light.DarkActionBar">
 4 |         <!-- Customize your theme here. -->
 5 |         <item name="colorPrimary">@color/colorPrimary</item>
 6 |         <item name="colorPrimaryDark">@color/colorPrimaryDark</item>
 7 |         <item name="colorAccent">@color/colorAccent</item>
 8 |     </style>
 9 | 
10 |     <style name="DefaultButton" parent="Theme.AppCompat.Light.DarkActionBar">
11 |         <item name="colorButtonNormal">@drawable/btn</item>
12 |         <item name="android:textColor">@color/colorPrimaryDark</item>
13 |     </style>
14 | </resources>
15 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/values/themes.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <resources>
3 |     <style name="Theme.ExecuTorchLlamaDemo" parent="android:Theme.Light" />
4 | </resources>
5 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/xml/backup_rules.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?><!--
 2 |    Sample backup rules file; uncomment and customize as necessary.
 3 |    See https://developer.android.com/guide/topics/data/autobackup
 4 |    for details.
 5 |    Note: This file is ignored for devices older that API 31
 6 |    See https://developer.android.com/about/versions/12/backup-restore
 7 | -->
 8 | <full-backup-content>
 9 |     <!--
10 |    <include domain="sharedpref" path="."/>
11 |    <exclude domain="sharedpref" path="device.xml"/>
12 | -->
13 | </full-backup-content>
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/xml/data_extraction_rules.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?><!--
 2 |    Sample data extraction rules file; uncomment and customize as necessary.
 3 |    See https://developer.android.com/about/versions/12/backup-restore#xml-changes
 4 |    for details.
 5 | -->
 6 | <data-extraction-rules>
 7 |     <cloud-backup>
 8 |         <!-- TODO: Use <include> and <exclude> to control what is backed up.
 9 |         <include .../>
10 |         <exclude .../>
11 |         -->
12 |     </cloud-backup>
13 |     <!--
14 |     <device-transfer>
15 |         <include .../>
16 |         <exclude .../>
17 |     </device-transfer>
18 |     -->
19 | </data-extraction-rules>
20 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/app/src/main/res/xml/file_paths.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="utf-8"?>
2 | <paths xmlns:android="http://schemas.android.com/apk/res/android">
3 |     <external-cache-path name="my_cache" path="." />
4 | </paths>


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/build.gradle.kts:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | // Top-level build file where you can add configuration options common to all sub-projects/modules.
10 | plugins {
11 |   id("com.android.application") version "8.1.0" apply false
12 |   id("org.jetbrains.kotlin.android") version "1.8.10" apply false
13 | }
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/gradle.properties:
--------------------------------------------------------------------------------
 1 | # Project-wide Gradle settings.
 2 | # IDE (e.g. Android Studio) users:
 3 | # Gradle settings configured through the IDE *will override*
 4 | # any settings specified in this file.
 5 | # For more details on how to configure your build environment visit
 6 | # http://www.gradle.org/docs/current/userguide/build_environment.html
 7 | # Specifies the JVM arguments used for the daemon process.
 8 | # The setting is particularly useful for tweaking memory settings.
 9 | org.gradle.jvmargs=-Xmx2048m -Dfile.encoding=UTF-8
10 | # When configured, Gradle will run in incubating parallel mode.
11 | # This option should only be used with decoupled projects. More details, visit
12 | # http://www.gradle.org/docs/current/userguide/multi_project_builds.html#sec:decoupled_projects
13 | # org.gradle.parallel=true
14 | # AndroidX package structure to make it clearer which packages are bundled with the
15 | # Android operating system, and which are packaged with your app's APK
16 | # https://developer.android.com/topic/libraries/support-library/androidx-rn
17 | android.useAndroidX=true
18 | # Kotlin code style for this project: "official" or "obsolete":
19 | kotlin.code.style=official
20 | # Enables namespacing of each library's R class so that its R class includes only the
21 | # resources declared in the library itself and none from the library's dependencies,
22 | # thereby reducing the size of the R class for that library
23 | android.nonTransitiveRClass=true
24 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/gradle/wrapper/gradle-wrapper.properties:
--------------------------------------------------------------------------------
1 | #Mon Sep 25 11:23:11 PDT 2023
2 | distributionBase=GRADLE_USER_HOME
3 | distributionPath=wrapper/dists
4 | distributionUrl=https\://services.gradle.org/distributions/gradle-8.0-bin.zip
5 | zipStoreBase=GRADLE_USER_HOME
6 | zipStorePath=wrapper/dists
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/screenshot.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/ArticleSummarizer/screenshot.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/ArticleSummarizer/settings.gradle.kts:
--------------------------------------------------------------------------------
 1 | /*
 2 |  * Copyright (c) Meta Platforms, Inc. and affiliates.
 3 |  * All rights reserved.
 4 |  *
 5 |  * This source code is licensed under the BSD-style license found in the
 6 |  * LICENSE file in the root directory of this source tree.
 7 |  */
 8 | 
 9 | pluginManagement {
10 |   repositories {
11 |     google()
12 |     mavenCentral()
13 |     gradlePluginPortal()
14 |   }
15 | }
16 | 
17 | dependencyResolutionManagement {
18 |   repositoriesMode.set(RepositoriesMode.FAIL_ON_PROJECT_REPOS)
19 |   repositories {
20 |     google()
21 |     mavenCentral()
22 |   }
23 | }
24 | 
25 | rootProject.name = "Llama Android Demo"
26 | 
27 | include(":app")
28 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/Contextual-Chunking-RAG/README.md:
--------------------------------------------------------------------------------
 1 | # Contextual keywords generation for RAG using Llama-3.1
 2 | 
 3 | **Problem**: Independent chunking in traditional RAG systems leads to the loss of contextual information between chunks. This makes it difficult for LLMs to retrieve relevant data when context (e.g., the subject or entity being discussed) is not explicitly repeated within individual chunks.
 4 | 
 5 | **Solution**: Generate keywords for each chunk to fulfill missing contextual information. These keywords (e.g., "BMW, X5, pricing") enrich the chunk with necessary context, ensuring better retrieval accuracy. By embedding this enriched metadata, the system bridges gaps between related chunks, enabling effective query matching and accurate answer generation.
 6 | 
 7 | [This article](https://medium.com/@ailabs/overcoming-independent-chunking-in-rag-systems-a-hybrid-approach-5d2c205b3732) explains benefits of contextual chunking.
 8 | 
 9 | **Note** This method does not require calling LLM for each chunk separately, which makes it efficient.
10 | 
11 | **Getting started**
12 | In this cookbook, we’ll use DeepInfra for Llama inference services, so be sure to obtain an API key from https://deepinfra.com/.
13 | You'll also need a LlamaParse API key to parse PDF files, which can be obtained from https://www.llamaindex.ai/.
14 | Additionally, we will use the "jinaai/jina-embeddings-v2-base-en" model from HuggingFace to generate text embeddings locally.
15 | Before getting started, update the <code>config.py</code> file as following:
16 |     "DEEPINFRA_API_KEY"="<your_api_key>"    
17 |     "LLAMAPARSE_API_KEY"="<your_api_key>"


--------------------------------------------------------------------------------
/end-to-end-use-cases/Contextual-Chunking-RAG/config.py:
--------------------------------------------------------------------------------
1 | LLAMAPARSE_API_KEY=""
2 | DEEPINFRA_API_KEY=""
3 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/Contextual-Chunking-RAG/embedding.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from transformers import AutoTokenizer, AutoModel
 3 | from llama_index.core.base.embeddings.base import BaseEmbedding
 4 | 
 5 | device = "cuda" if torch.cuda.is_available() else "cpu"
 6 | 
 7 | # Load tokenizer and model
 8 | model_id = "jinaai/jina-embeddings-v2-base-en" #"jinaai/jina-embeddings-v3"
 9 | tokenizer = AutoTokenizer.from_pretrained(model_id)
10 | model = AutoModel.from_pretrained(model_id, trust_remote_code=True).to(device)
11 | 
12 | # Define function to generate embeddings
13 | def get_embedding(text):
14 |     inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True).to(device)
15 |     with torch.no_grad():
16 |         outputs = model(**inputs)    
17 |     return outputs.last_hidden_state.mean(dim=1).squeeze().cpu().numpy() #.to(torch.float32)
18 | 
19 | 
20 | class LocalJinaEmbedding(BaseEmbedding):
21 |     def __init__(self):
22 |         super().__init__()
23 | 
24 |     def _get_text_embedding(self, text):
25 |         return get_embedding(text).tolist()  # Ensure compatibility with LlamaIndex
26 | 
27 |     def _get_query_embedding(self, query):
28 |         return get_embedding(query).tolist()
29 |     
30 |     async def _aget_query_embedding(self, query: str) -> list:
31 |         return get_embedding(query).tolist()
32 | 
33 | 
34 | 
35 | def test(): #this did not produce reasonable results for some reason
36 |     #!pip install llama-index-embeddings-huggingface
37 |     from llama_index.embeddings.huggingface import HuggingFaceEmbedding 
38 |     embed_model = HuggingFaceEmbedding(model_name=model_id)
39 | 
40 | 
41 | if __name__=="__main__":
42 | 	emb = get_embedding("hi there")
43 | 	print(emb.shape)
44 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/requirements.txt:
--------------------------------------------------------------------------------
 1 | # Core dependencies
 2 | PyPDF2>=3.0.0
 3 | torch>=2.0.0
 4 | transformers>=4.46.0
 5 | accelerate>=0.27.0
 6 | rich>=13.0.0
 7 | ipywidgets>=8.0.0
 8 | tqdm>=4.66.0
 9 | 
10 | # Optional but recommended
11 | jupyter>=1.0.0
12 | ipykernel>=6.0.0
13 | 
14 | # Warning handling
15 | warnings>=0.1.0


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/resources/2402.13116v4.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/NotebookLlama/resources/2402.13116v4.pdf


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/resources/Outline.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/NotebookLlama/resources/Outline.jpg


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/resources/_podcast.mp3:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/NotebookLlama/resources/_podcast.mp3


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/resources/data.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/NotebookLlama/resources/data.pkl


--------------------------------------------------------------------------------
/end-to-end-use-cases/NotebookLlama/resources/podcast_ready_data.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/NotebookLlama/resources/podcast_ready_data.pkl


--------------------------------------------------------------------------------
/end-to-end-use-cases/RAFT-Chatbot/config.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import yaml
 5 | 
 6 | def load_config(config_path: str = "./config.yaml"):
 7 |     # Read the YAML configuration file
 8 |     with open(config_path, "r") as file:
 9 |         config = yaml.safe_load(file)
10 |     return config
11 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/RAFT-Chatbot/images/Answers_Precision.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/RAFT-Chatbot/images/Answers_Precision.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/RAFT-Chatbot/images/LLM_score_comparison.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/RAFT-Chatbot/images/LLM_score_comparison.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/RAFT-Chatbot/images/Num_of_refusal_comparison.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/RAFT-Chatbot/images/Num_of_refusal_comparison.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/RAFT-Chatbot/images/RAFT.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/RAFT-Chatbot/images/RAFT.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/agents/DeepLearningai_Course_Notebooks/README.md:
--------------------------------------------------------------------------------
 1 | # Quickstart Llama 3 Powered Agent Examples Ported from DeepLearning.ai Short Courses
 2 | 
 3 | The notebooks in this folder are ported from the 4 recent agent short courses on [Deeplearning.ai](https://www.deeplearning.ai) to use Llama 3 to build agent apps from scratch or with open source frameworks (LangChain, LlamaIndex, AutoGen).
 4 | 
 5 | 1. [Functions Tools and Agents with LangChain L1 Function Calling](Functions_Tools_and_Agents_with_LangChain_L1_Function_Calling.ipynb)
 6 | 
 7 | 2. [AI Agents in LangGraph L1 Build an Agent from Scratch](AI_Agents_in_LangGraph_L1_Build_an_Agent_from_Scratch.ipynb)
 8 | 
 9 | 3. [Building Agentic RAG with Llamaindex L1 Router Engine](Building_Agentic_RAG_with_Llamaindex_L1_Router_Engine.ipynb)
10 | 
11 | 4. [AI Agentic Design Patterns with AutoGen L4 Tool Use and Conversational Chess](AI_Agentic_Design_Patterns_with_AutoGen_L4_Tool_Use_and_Conversational_Chess.ipynb)
12 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/agents/README.md:
--------------------------------------------------------------------------------
1 | ## Agents and Tool Calling
2 | 
3 | Structure:
4 | 
5 | - Agents_Tutorial: Showcases 101 and 201 notebooks guidance for using tool calling with Llama models
6 | - DeepLearning_Course_Notebooks: Notebooks from the DL.ai course teaching Agents


--------------------------------------------------------------------------------
/end-to-end-use-cases/agents/calendar_assistant/assets/flow_diagram.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/agents/calendar_assistant/assets/flow_diagram.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/agents/calendar_assistant/assets/google_calendar.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/agents/calendar_assistant/assets/google_calendar.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/README.md:
--------------------------------------------------------------------------------
1 | # Benchmarks
2 | 
3 | * inference - a folder contains benchmark scripts that apply a throughput analysis for Llama models inference on various backends including on-prem, cloud and on-device.
4 | * llm_eval_harness - a folder that introduces `lm-evaluation-harness`, a tool to evaluate Llama models including quantized models focusing on quality. We also included a recipe that calculates Llama 3.1 evaluation metrics Using `lm-evaluation-harness` and instructions that calculate HuggingFace Open LLM Leaderboard v2 metrics.
5 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/evals_synthetic_data/Workflow_Diagram.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/benchmarks/evals_synthetic_data/Workflow_Diagram.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/evals_synthetic_data/generated_data/tabular_data.csv:
--------------------------------------------------------------------------------
 1 | ,start_date,end_date,salary,duration,student_id,high_perc,high_spec,mba_spec,second_perc,gender,degree_perc,placed,experience_years,employability_perc,mba_perc,work_experience,degree_type
 2 | 0,2020-01-10,,,3.0,3040587,66.62,Science,Mkt&Fin,75.01,M,75.76,True,1,85.98,58.37,True,Sci&Tech
 3 | 1,,2020-11-07,39320.0,,5940200,81.61,Commerce,Mkt&HR,73.03,M,67.27,True,1,91.44,65.12,False,Comm&Mgmt
 4 | 2,2020-02-21,2020-07-08,36408.0,3.0,13408830,62.71,Arts,Mkt&Fin,82.09,F,71.97,True,1,62.18,71.15,True,Comm&Mgmt
 5 | 3,2020-01-30,2020-09-29,36591.0,3.0,16186310,51.0,Commerce,Mkt&Fin,62.04,M,65.32,True,1,61.87,58.9,False,Comm&Mgmt
 6 | 4,2020-01-16,,33032.0,,2086931,67.04,Commerce,Mkt&Fin,53.53,M,51.08,True,1,58.65,56.32,False,Sci&Tech
 7 | 5,2020-07-20,,31536.0,3.0,6414765,80.3,Science,Mkt&HR,87.34,M,74.1,True,1,64.24,68.55,False,Sci&Tech
 8 | 6,2020-02-13,2020-11-26,32428.0,12.0,6180804,67.61,Commerce,Mkt&HR,49.94,M,72.79,True,1,86.51,69.26,False,Sci&Tech
 9 | 7,2020-01-02,2020-07-14,36317.0,6.0,14357765,63.09,Commerce,Mkt&Fin,86.17,M,83.25,True,1,71.89,75.9,False,Sci&Tech
10 | 8,,2020-05-10,27104.0,3.0,9499396,77.42,Science,Mkt&HR,71.74,F,66.19,False,1,95.38,59.49,False,Sci&Tech
11 | 9,2020-01-01,2020-04-15,,3.0,10945558,57.54,Science,Mkt&HR,57.63,F,72.51,True,1,86.4,60.99,True,Comm&Mgmt
12 | 10,2020-01-01,2020-10-27,,6.0,5714925,82.43,Science,Mkt&Fin,68.14,M,76.55,True,1,95.86,67.78,False,Sci&Tech
13 | 11,2020-01-01,2020-07-02,,3.0,12273151,58.25,Commerce,Mkt&Fin,65.04,M,61.35,True,1,65.73,55.15,True,Comm&Mgmt
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/CFT.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/CFT.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/business_summary.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/business_summary.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/instances.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/instances.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/latency_vs_tokens.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/benchmarks/inference/cloud/aws/fmbench/img/latency_vs_tokens.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/cloud/azure/parameters.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     "MAX_NEW_TOKEN" : 256,
 3 |     "CONCURRENT_LEVELS" : [1, 2, 4, 8, 16, 32, 64],
 4 |     "THRESHOLD_TPS" : 7,
 5 |     "MODEL_PATH" : "meta-llama/your-model-path",
 6 |     "RANDOM_PROMPT_LENGTH" : 25,
 7 |     "TEMPERATURE" : 0.6,
 8 |     "TOP_P" : 0.9,
 9 |     "MODEL_ENDPOINTS" : "https://your-endpoint.inference.ai.azure.com/v1/chat/completions",
10 |     "API_KEY" : "your-auth-key",
11 |     "SYS_PROMPT" : "You are a helpful assistant."
12 | }


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/on_prem/vllm/parameters.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     "MAX_NEW_TOKENS" : 256,
 3 |     "CONCURRENT_LEVELS" : [1, 2, 4, 8, 16, 32, 64, 128, 256],
 4 |     "MODEL_PATH" : "meta-llama/your-model-path",
 5 |     "MODEL_HEADERS" : {"Content-Type": "application/json"},
 6 |     "SAFE_CHECK" : true,
 7 |     "THRESHOLD_TPS" : 7,
 8 |     "RANDOM_PROMPT_LENGTH" : 1000,
 9 |     "TEMPERATURE" : 0.6,
10 |     "TOP_P" : 0.9,
11 |     "MODEL_ENDPOINTS" : [
12 |         "http://localhost:8000/v1/chat/completions"
13 |     ]
14 | }
15 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/inference/requirements.txt:
--------------------------------------------------------------------------------
1 | transformers
2 | requests
3 | azure-core
4 | azure-ai-contentsafety
5 | torch
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/bbh/bbh_3shot_cot.yaml:
--------------------------------------------------------------------------------
 1 | dataset_path: meta-llama/Llama-3.1-8B-evals
 2 | dataset_name: Llama-3.1-8B-evals__bbh__details
 3 | task: meta_bbh
 4 | output_type: generate_until
 5 | process_docs: !function utils.process_docs
 6 | test_split: latest
 7 | doc_to_text: !function utils.doc_to_text
 8 | doc_to_target: answer
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         regex_pattern: 'the answer is (.*?)\.'
14 |       - function: "take_first"
15 | generation_kwargs:
16 |   until: "\n\nQ: "
17 |   do_sample: false
18 |   temperature: 0
19 |   max_gen_toks: 512
20 | num_fewshot: 0
21 | metric_list:
22 |   - metric: exact_match
23 |     aggregation: mean
24 |     higher_is_better: true
25 |     ignore_case: true
26 |     ignore_punctuation: true
27 | metadata:
28 |   version: 1.0
29 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/bbh/utils.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | import re
 3 | 
 4 | import datasets
 5 | 
 6 | 
 7 | 
 8 | def doc_to_text(doc: dict) -> str:
 9 |     return doc["input_final_prompts"][0]
10 | 
11 | def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
12 |     def _process_doc(doc: dict) -> dict:
13 |         out_doc = {
14 |             "problem": doc["input_question"],
15 |             "answer": doc["input_correct_responses"][0],
16 |         }
17 |         return out_doc
18 |     dataset = dataset.select_columns(["input_question", "input_correct_responses", "input_final_prompts", "is_correct","input_question_hash","output_prediction_text"])
19 |     dataset = dataset.rename_column("is_correct","previously_is_correct")
20 |     dataset = dataset.map(_process_doc)
21 |     return dataset.map(_process_doc)
22 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/gpqa/gpqa_0shot.yaml:
--------------------------------------------------------------------------------
 1 | dataset_path: meta-llama/Llama-3.1-8B-Instruct-evals
 2 | dataset_name: Llama-3.1-8B-Instruct-evals__gpqa__details
 3 | task: meta_gpqa
 4 | output_type: generate_until
 5 | process_docs: !function utils.process_docs
 6 | test_split: latest
 7 | doc_to_text: !function utils.doc_to_text
 8 | doc_to_target: gold
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         group_select: -1
14 |         regex_pattern: ' ([A-Z])'
15 |       - function: "take_first"
16 | generation_kwargs:
17 |   until: []
18 |   do_sample: false
19 |   temperature: 0
20 |   max_gen_toks: 2048
21 | num_fewshot: 0
22 | metric_list:
23 |   - metric: exact_match
24 |     aggregation: mean
25 |     higher_is_better: true
26 |     ignore_case: true
27 |     ignore_punctuation: true
28 | metadata:
29 |   version: 1.0
30 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/gpqa/utils.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | import re
 3 | 
 4 | import datasets
 5 | 
 6 | def doc_to_text(doc: dict) -> str:
 7 |     return doc["input_final_prompts"][0]
 8 | 
 9 | def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
10 |     def _process_doc(doc: dict) -> dict:
11 |         out_doc = {
12 |             "problem": doc["input_question"],
13 |             "gold": doc["input_correct_responses"][0],
14 |         }
15 |         return out_doc
16 |     dataset = dataset.select_columns(["input_question", "input_correct_responses", "input_final_prompts", "is_correct","input_question_hash","input_choice_list","output_prediction_text"])
17 |     dataset = dataset.rename_column("is_correct","previously_is_correct")
18 |     dataset = dataset.map(_process_doc)
19 |     return dataset.map(_process_doc)
20 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/gpqa_cot/gpqa_0shot_cot.yaml:
--------------------------------------------------------------------------------
 1 | dataset_path: meta-llama/Llama-3.1-8B-Instruct-evals
 2 | dataset_name: Llama-3.1-8B-Instruct-evals__gpqa__details
 3 | task: meta_gpqa_cot
 4 | output_type: generate_until
 5 | process_docs: !function utils.process_docs
 6 | test_split: latest
 7 | doc_to_text: !function utils.doc_to_text
 8 | doc_to_target: gold
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         group_select: -1
14 |         regex_pattern: 'best answer is ([A-Z])'
15 |       - function: "take_first"
16 | generation_kwargs:
17 |   until: []
18 |   do_sample: false
19 |   temperature: 0
20 |   max_gen_toks: 2048
21 | num_fewshot: 0
22 | metric_list:
23 |   - metric: exact_match
24 |     aggregation: mean
25 |     higher_is_better: true
26 |     ignore_case: true
27 |     ignore_punctuation: true
28 | metadata:
29 |   version: 1.0
30 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/gpqa_cot/utils.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | import re
 3 | 
 4 | import datasets
 5 | 
 6 | 
 7 | 
 8 | def doc_to_text(doc: dict) -> str:
 9 |     return doc["input_final_prompts"][0]
10 | def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
11 |     def _process_doc(doc: dict) -> dict:
12 |         out_doc = {
13 |             "problem": doc["input_question"],
14 |             "gold": doc["input_correct_responses"][0],
15 |         }
16 |         return out_doc
17 |     dataset = dataset.select_columns(["input_question", "input_correct_responses", "input_final_prompts", "is_correct","input_question_hash","input_choice_list","output_prediction_text"])
18 |     dataset = dataset.rename_column("is_correct","previously_is_correct")
19 |     dataset = dataset.map(_process_doc)
20 |     return dataset.map(_process_doc)
21 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/ifeval/ifeval.yaml:
--------------------------------------------------------------------------------
 1 | task: meta_ifeval
 2 | dataset_path: parquet
 3 | dataset_kwargs:
 4 |   data_files: ./work_dir/joined_ifeval.parquet
 5 | output_type: generate_until
 6 | test_split: train
 7 | num_fewshot: 0
 8 | doc_to_text: prompt
 9 | doc_to_target: 0
10 | generation_kwargs:
11 |   until: []
12 |   do_sample: false
13 |   temperature: 0.0
14 |   max_gen_toks: 1280
15 | process_results: !function utils.process_results
16 | metric_list:
17 |   - metric: prompt_level_strict_acc
18 |     aggregation: mean
19 |     higher_is_better: true
20 |   - metric: inst_level_strict_acc
21 |     aggregation: !function utils.agg_inst_level_acc
22 |     higher_is_better: true
23 |   - metric: prompt_level_loose_acc
24 |     aggregation: mean
25 |     higher_is_better: true
26 |   - metric: inst_level_loose_acc
27 |     aggregation: !function utils.agg_inst_level_acc
28 |     higher_is_better: true
29 | metadata:
30 |   version: 2.0
31 | fewshot_config:
32 |   sampler: first_n
33 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/math_hard/math_4shot_cot.yaml:
--------------------------------------------------------------------------------
 1 | dataset_path: parquet
 2 | dataset_kwargs:
 3 |   data_files: ./work_dir/joined_math.parquet
 4 | task: meta_math
 5 | process_docs: !function utils.process_docs
 6 | output_type: generate_until
 7 | test_split: train
 8 | doc_to_text:  !function utils.doc_to_text
 9 | process_results: !function utils.process_results
10 | doc_to_target: answer
11 | generation_kwargs:
12 |   until: []
13 |   do_sample: false
14 |   temperature: 0
15 |   max_gen_toks: 512
16 | metric_list:
17 |   - metric: exact_match
18 |     aggregation: mean
19 |     higher_is_better: true
20 | metadata:
21 |   version: 1.0


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/math_hard/math_hard_0shot_cot.yaml:
--------------------------------------------------------------------------------
 1 | dataset_path: parquet
 2 | dataset_kwargs:
 3 |   data_files: ./work_dir/joined_math_hard.parquet
 4 | task: meta_math_hard
 5 | process_docs: !function utils.process_docs
 6 | output_type: generate_until
 7 | test_split: train
 8 | doc_to_text:  !function utils.doc_to_text
 9 | process_results: !function utils.process_results
10 | doc_to_target: answer
11 | generation_kwargs:
12 |   until: []
13 |   do_sample: false
14 |   temperature: 0
15 |   max_gen_toks: 5120
16 | metric_list:
17 |   - metric: exact_match
18 |     aggregation: mean
19 |     higher_is_better: true
20 | metadata:
21 |   version: 1.0
22 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/meta_instruct.yaml:
--------------------------------------------------------------------------------
1 | group: meta_instruct
2 | task:
3 |   - meta_ifeval
4 |   - meta_math_hard
5 |   - meta_gpqa
6 |   - meta_mmlu_pro_instruct
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/meta_pretrain.yaml:
--------------------------------------------------------------------------------
1 | group: meta_pretrain
2 | task:
3 |   - meta_bbh
4 |   - meta_mmlu_pro_pretrain
5 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/mmlu/mmlu_instruct.yaml:
--------------------------------------------------------------------------------
 1 | task: meta_mmlu_instruct
 2 | dataset_path: meta-llama/Llama-3.1-8B-Instruct-evals
 3 | dataset_name: Llama-3.1-8B-Instruct-evals__mmlu__details
 4 | test_split: latest
 5 | output_type: generate_until
 6 | process_docs: !function utils.process_docs_instruct
 7 | doc_to_text: !function utils.doc_to_text_instruct
 8 | doc_to_target: gold
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         group_select: -1
14 |         regex_pattern: ' ([A-D])'
15 |       - function: "take_first"
16 | generation_kwargs:
17 |   until: []
18 |   do_sample: false
19 |   temperature: 0
20 |   max_gen_toks: 1024
21 | num_fewshot: 0
22 | metric_list:
23 |   - metric: exact_match
24 |     aggregation: mean
25 |     higher_is_better: true
26 |     ignore_case: true
27 |     ignore_punctuation: true
28 | metadata:
29 |   version: 1.0
30 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/mmlu/mmlu_pretrain.yaml:
--------------------------------------------------------------------------------
 1 | task: meta_mmlu
 2 | dataset_path: meta-llama/Llama-3.1-8B-evals
 3 | dataset_name: Llama-3.1-8B-evals__mmlu__details
 4 | test_split: latest
 5 | output_type: multiple_choice
 6 | process_docs: !function utils.process_docs_pretrain
 7 | doc_to_text: !function utils.doc_to_text_pretrain
 8 | doc_to_target: !function utils.doc_to_target
 9 | doc_to_choice: ["A", "B", "C", "D"]
10 | # 5-shot prompts are already included in the dataset
11 | # So no need to generate
12 | num_fewshot: 0
13 | metadata:
14 |   version: 1.0
15 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/mmlu_pro/mmlu_pro_5shot_cot_instruct.yaml:
--------------------------------------------------------------------------------
 1 | task: meta_mmlu_pro_instruct
 2 | dataset_path: meta-llama/Llama-3.1-8B-Instruct-evals
 3 | dataset_name: Llama-3.1-8B-Instruct-evals__mmlu_pro__details
 4 | test_split: latest
 5 | output_type: generate_until
 6 | process_docs: !function utils.process_docs
 7 | doc_to_text: !function utils.doc_to_text
 8 | doc_to_target: gold
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         group_select: -1
14 |         regex_pattern: 'best answer is ([A-Z])'
15 |       - function: "take_first"
16 | generation_kwargs:
17 |   until: []
18 |   do_sample: false
19 |   temperature: 0
20 |   max_gen_toks: 1024
21 | num_fewshot: 0
22 | metric_list:
23 |   - metric: exact_match
24 |     aggregation: mean
25 |     higher_is_better: true
26 |     ignore_case: true
27 |     ignore_punctuation: true
28 | metadata:
29 |   version: 1.0
30 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/mmlu_pro/mmlu_pro_5shot_cot_pretrain.yaml:
--------------------------------------------------------------------------------
 1 | task: meta_mmlu_pro_pretrain
 2 | dataset_path: meta-llama/Llama-3.1-8B-evals
 3 | dataset_name: Llama-3.1-8B-evals__mmlu_pro__details
 4 | test_split: latest
 5 | output_type: generate_until
 6 | process_docs: !function utils.process_docs
 7 | doc_to_text: !function utils.doc_to_text
 8 | doc_to_target: gold
 9 | filter_list:
10 |   - name: "strict-match"
11 |     filter:
12 |       - function: "regex"
13 |         regex_pattern: 'answer is \(([A-Z])\)'
14 |       - function: "take_first"
15 | generation_kwargs:
16 |   until: "\n\nQ: "
17 |   do_sample: false
18 |   temperature: 0
19 |   max_gen_toks: 512
20 | num_fewshot: 0
21 | metric_list:
22 |   - metric: exact_match
23 |     aggregation: mean
24 |     higher_is_better: true
25 |     ignore_case: true
26 |     ignore_punctuation: true
27 | metadata:
28 |   version: 1.0
29 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/benchmarks/llm_eval_harness/meta_eval/meta_template/mmlu_pro/utils.py:
--------------------------------------------------------------------------------
 1 | import string
 2 | 
 3 | import datasets
 4 | 
 5 | 
 6 | def doc_to_text(doc: dict) -> str:
 7 |     return doc["input_final_prompts"][0]
 8 | 
 9 | 
10 | def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
11 |     def _process_doc(doc: dict) -> dict:
12 |         out_doc = {
13 |             "problem": doc["input_question"],
14 |             "gold": doc["input_correct_responses"][0],
15 |         }
16 |         return out_doc
17 | 
18 |     dataset = dataset.select_columns(
19 |         [
20 |             "input_question",
21 |             "input_correct_responses",
22 |             "input_final_prompts",
23 |             "is_correct",
24 |             "input_question_hash",
25 |             "input_choice_list",
26 |             "output_prediction_text",
27 |         ]
28 |     )
29 |     dataset = dataset.rename_column("is_correct", "previously_is_correct")
30 |     dataset = dataset.map(_process_doc)
31 |     return dataset.map(_process_doc)
32 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/.gitignore:
--------------------------------------------------------------------------------
 1 | # See https://help.github.com/articles/ignoring-files/ for more about ignoring files.
 2 | 
 3 | # dependencies
 4 | /node_modules
 5 | /.pnp
 6 | .pnp.js
 7 | 
 8 | # testing
 9 | /coverage
10 | 
11 | # production
12 | /build
13 | 
14 | # misc
15 | .DS_Store
16 | .env.local
17 | .env.development.local
18 | .env.test.local
19 | .env.production.local
20 | 
21 | npm-debug.log*
22 | yarn-debug.log*
23 | yarn-error.log*
24 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "bookmind",
 3 |   "version": "0.1.0",
 4 |   "private": true,
 5 |   "dependencies": {
 6 |     "@testing-library/jest-dom": "^5.17.0",
 7 |     "@testing-library/react": "^13.4.0",
 8 |     "@testing-library/user-event": "^13.5.0",
 9 |     "axios": "^1.7.7",
10 |     "force-graph": "^1.49.5",
11 |     "fs": "^0.0.1-security",
12 |     "lottie-react": "^2.4.0",
13 |     "lucide-react": "^0.460.0",
14 |     "react": "^18.3.1",
15 |     "react-dom": "^18.3.1",
16 |     "react-force-graph": "^1.44.7",
17 |     "react-force-graph-2d": "^1.25.8",
18 |     "react-icons": "^4.10.1",
19 |     "react-router-dom": "^7.0.1",
20 |     "react-scripts": "^5.0.1",
21 |     "web-vitals": "^2.1.4"
22 |   },
23 |   "scripts": {
24 |     "start": "react-scripts start",
25 |     "build": "react-scripts build",
26 |     "test": "react-scripts test",
27 |     "eject": "react-scripts eject"
28 |   },
29 |   "eslintConfig": {
30 |     "extends": [
31 |       "react-app",
32 |       "react-app/jest"
33 |     ]
34 |   },
35 |   "browserslist": {
36 |     "production": [
37 |       ">0.2%",
38 |       "not dead",
39 |       "not op_mini all"
40 |     ],
41 |     "development": [
42 |       "last 1 chrome version",
43 |       "last 1 firefox version",
44 |       "last 1 safari version"
45 |     ]
46 |   },
47 |   "devDependencies": {
48 |     "tailwindcss": "^3.4.15"
49 |   }
50 | }
51 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/character_relationship.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/character_relationship.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/chat_interface.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/chat_interface.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/favicon.ico


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/index.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | <html lang="en">
 3 |   <head>
 4 |     <meta charset="utf-8" />
 5 |     <link rel="icon" href="%PUBLIC_URL%/favicon.ico" />
 6 |     <meta name="viewport" content="width=device-width, initial-scale=1" />
 7 |     <meta name="theme-color" content="#000000" />
 8 |     <meta
 9 |       name="description"
10 |       content="Web site created using create-react-app"
11 |     />
12 |     <link rel="apple-touch-icon" href="%PUBLIC_URL%/logo192.png" />
13 |     <!--
14 |       manifest.json provides metadata used when your web app is installed on a
15 |       user's mobile device or desktop. See https://developers.google.com/web/fundamentals/web-app-manifest/
16 |     -->
17 |     <link rel="manifest" href="%PUBLIC_URL%/manifest.json" />
18 |     <!--
19 |       Notice the use of %PUBLIC_URL% in the tags above.
20 |       It will be replaced with the URL of the `public` folder during the build.
21 |       Only files inside the `public` folder can be referenced from the HTML.
22 | 
23 |       Unlike "/favicon.ico" or "favicon.ico", "%PUBLIC_URL%/favicon.ico" will
24 |       work correctly both with client-side routing and a non-root public URL.
25 |       Learn how to configure a non-root public URL by running `npm run build`.
26 |     -->
27 |     <title>React App</title>
28 |   </head>
29 |   <body>
30 |     <noscript>You need to enable JavaScript to run this app.</noscript>
31 |     <div id="root"></div>
32 |     <!--
33 |       This HTML file is a template.
34 |       If you open it directly in the browser, you will see an empty page.
35 | 
36 |       You can add webfonts, meta tags, or analytics to this file.
37 |       The build step will place the bundled scripts into the <body> tag.
38 | 
39 |       To begin the development, run `npm start` or `yarn start`.
40 |       To create a production bundle, use `npm run build` or `yarn build`.
41 |     -->
42 |   </body>
43 | </html>
44 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/logo192.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/logo192.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/logo512.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/logo512.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/manifest.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "short_name": "React App",
 3 |   "name": "Create React App Sample",
 4 |   "icons": [
 5 |     {
 6 |       "src": "favicon.ico",
 7 |       "sizes": "64x64 32x32 24x24 16x16",
 8 |       "type": "image/x-icon"
 9 |     },
10 |     {
11 |       "src": "logo192.png",
12 |       "type": "image/png",
13 |       "sizes": "192x192"
14 |     },
15 |     {
16 |       "src": "logo512.png",
17 |       "type": "image/png",
18 |       "sizes": "512x512"
19 |     }
20 |   ],
21 |   "start_url": ".",
22 |   "display": "standalone",
23 |   "theme_color": "#000000",
24 |   "background_color": "#ffffff"
25 | }
26 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/mindmap.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/book-character-mindmap/public/mindmap.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/public/robots.txt:
--------------------------------------------------------------------------------
1 | # https://www.robotstxt.org/robotstxt.html
2 | User-agent: *
3 | Disallow:
4 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/server/requirements.txt:
--------------------------------------------------------------------------------
1 | flask
2 | flask-cors
3 | asyncio
4 | werkzeug
5 | vllm
6 | transformers
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/App.css:
--------------------------------------------------------------------------------
 1 | .App {
 2 |   text-align: center;
 3 | }
 4 | 
 5 | .App-logo {
 6 |   height: 40vmin;
 7 |   pointer-events: none;
 8 | }
 9 | 
10 | @media (prefers-reduced-motion: no-preference) {
11 |   .App-logo {
12 |     animation: App-logo-spin infinite 20s linear;
13 |   }
14 | }
15 | 
16 | .App-header {
17 |   background-color: #282c34;
18 |   min-height: 100vh;
19 |   display: flex;
20 |   flex-direction: column;
21 |   align-items: center;
22 |   justify-content: center;
23 |   font-size: calc(10px + 2vmin);
24 |   color: white;
25 | }
26 | 
27 | .App-link {
28 |   color: #61dafb;
29 | }
30 | 
31 | @keyframes App-logo-spin {
32 |   from {
33 |     transform: rotate(0deg);
34 |   }
35 |   to {
36 |     transform: rotate(360deg);
37 |   }
38 | }
39 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/App.js:
--------------------------------------------------------------------------------
 1 | import { BrowserRouter as Router, Routes, Route } from "react-router-dom";
 2 | import Home from "./homePage/index";
 3 | import SearchPage from "./bookPage/components/SearchPage";
 4 | 
 5 | function App() {
 6 |   return (
 7 |     <Router>
 8 |       <Routes>
 9 |         {/* Define routes for Home and SearchPage */}
10 |         <Route path="/" element={<Home />} />
11 |         <Route path="/search" element={<SearchPage />} />
12 |       </Routes>
13 |     </Router>
14 |   );
15 | }
16 | 
17 | export default App;
18 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/App.test.js:
--------------------------------------------------------------------------------
1 | import { render, screen } from '@testing-library/react';
2 | import App from './App';
3 | 
4 | test('renders learn react link', () => {
5 |   render(<App />);
6 |   const linkElement = screen.getByText(/learn react/i);
7 |   expect(linkElement).toBeInTheDocument();
8 | });
9 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/approuter.jsx:
--------------------------------------------------------------------------------
 1 | /* eslint-disable no-extra-semi */
 2 | /* eslint-disable react/prop-types */
 3 | /* eslint-disable no-unused-vars */
 4 | import { Route, BrowserRouter as Router, Routes } from "react-router-dom";
 5 | 
 6 | import Home from "./pages/homePage";
 7 | import BookPage from "./pages/bookPage";
 8 | 
 9 | const AppRouter = function () {
10 |   return (
11 |     <>
12 |       <Routes>
13 |         <Route exact path="/" element={<Home />} />
14 |         <Route exact path="/search" element={<BookPage />} />
15 |       </Routes>
16 |     </>
17 |   );
18 | };
19 | 
20 | const App = () => (
21 |   <Router>
22 |     <AppRouter />
23 |   </Router>
24 | );
25 | 
26 | export default App;
27 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/index.css:
--------------------------------------------------------------------------------
1 | @tailwind base;
2 | @tailwind components;
3 | @tailwind utilities;
4 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/index.js:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import ReactDOM from "react-dom/client";
 3 | import "./index.css";
 4 | import AppRouter from "./approuter";
 5 | import reportWebVitals from "./reportWebVitals";
 6 | 
 7 | const root = ReactDOM.createRoot(document.getElementById("root"));
 8 | root.render(<AppRouter />);
 9 | 
10 | // If you want to start measuring performance in your app, pass a function
11 | // to log results (for example: reportWebVitals(console.log))
12 | // or send to an analytics endpoint. Learn more: https://bit.ly/CRA-vitals
13 | reportWebVitals();
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/pages/Layout.jsx:
--------------------------------------------------------------------------------
 1 | import "../index.css";
 2 | 
 3 | export const metadata = {
 4 |   title: "BookMind - Unravel Stories, One Map at a Time",
 5 |   description:
 6 |     "Explore character relationships and storylines with AI-powered visualizations.",
 7 | };
 8 | 
 9 | export default function RootLayout({ children }) {
10 |   return (
11 |     <html lang="en">
12 |       <head>
13 |         <title>{metadata.title}</title>
14 |         <meta name="description" content={metadata.description} />
15 |       </head>
16 |       <body>{children}</body>
17 |     </html>
18 |   );
19 | }
20 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/pages/bookPage/components/ErrorBoundary.jsx:
--------------------------------------------------------------------------------
 1 | 'use client'
 2 | 
 3 | import { Component } from 'react'
 4 | 
 5 | class ErrorBoundary extends Component {
 6 |   constructor(props) {
 7 |     super(props)
 8 |     this.state = { hasError: false }
 9 |   }
10 | 
11 |   static getDerivedStateFromError(error) {
12 |     return { hasError: true }
13 |   }
14 | 
15 |   componentDidCatch(error, errorInfo) {
16 |     console.log('ErrorBoundary caught an error:', error, errorInfo)
17 |   }
18 | 
19 |   render() {
20 |     if (this.state.hasError) {
21 |       return <h1>Something went wrong.</h1>
22 |     }
23 | 
24 |     return this.props.children
25 |   }
26 | }
27 | 
28 | export default ErrorBoundary
29 | 
30 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/pages/homePage/index.jsx:
--------------------------------------------------------------------------------
 1 | import Hero from "./components/Hero";
 2 | import Features from "./components/Features";
 3 | import HowItWorks from "./components/HowItWorks";
 4 | 
 5 | export default function Home() {
 6 |   return (
 7 |     <main className="min-h-screen bg-gradient-to-b from-indigo-100 to-white">
 8 |       <Hero />
 9 |       <Features />
10 |       <HowItWorks />
11 |     </main>
12 |   );
13 | }
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/reportWebVitals.js:
--------------------------------------------------------------------------------
 1 | const reportWebVitals = onPerfEntry => {
 2 |   if (onPerfEntry && onPerfEntry instanceof Function) {
 3 |     import('web-vitals').then(({ getCLS, getFID, getFCP, getLCP, getTTFB }) => {
 4 |       getCLS(onPerfEntry);
 5 |       getFID(onPerfEntry);
 6 |       getFCP(onPerfEntry);
 7 |       getLCP(onPerfEntry);
 8 |       getTTFB(onPerfEntry);
 9 |     });
10 |   }
11 | };
12 | 
13 | export default reportWebVitals;
14 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/src/setupTests.js:
--------------------------------------------------------------------------------
1 | // jest-dom adds custom jest matchers for asserting on DOM nodes.
2 | // allows you to do things like:
3 | // expect(element).toHaveTextContent(/react/i)
4 | // learn more: https://github.com/testing-library/jest-dom
5 | import '@testing-library/jest-dom';
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/book-character-mindmap/tailwind.config.js:
--------------------------------------------------------------------------------
 1 | /** @type {import('tailwindcss').Config} */
 2 | module.exports = {
 3 |   content: ["./src/**/*.{js,jsx,ts,tsx}"],
 4 |   theme: {
 5 |     extend: {
 6 |       keyframes: {
 7 |         fadeInUp: {
 8 |           "0%": { opacity: 0, transform: "translateY(20px)" },
 9 |           "100%": { opacity: 1, transform: "translateY(0)" },
10 |         },
11 |         fadeOutDown: {
12 |           "0%": { opacity: 1, transform: "translateY(0)" },
13 |           "100%": { opacity: 0, transform: "translateY(-20px)" },
14 |         },
15 |       },
16 |       animation: {
17 |         fadeInUp: "fadeInUp 0.3s ease-out",
18 |         fadeOutDown: "fadeOutDown 0.3s ease-in",
19 |       },
20 |     },
21 |   },
22 |   plugins: [],
23 | };
24 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/browser_use/README.md:
--------------------------------------------------------------------------------
 1 | ## Building an Intelligent Browser Agent with Llama 4 Scout
 2 | This project provides a comprehensive guide to creating an AI-powered browser agent capable of autonomously navigating and interacting with websites. By leveraging the capabilities of Llama 4 Scout, Playwright, and Together AI, this agent can perform tasks seamlessly while understanding both visual and textual content.
 3 | ### Features
 4 | - Visual Understanding: Utilizes screenshots for visual comprehension of web pages
 5 | - Autonomous Navigation: Capable of navigating and interacting with web elements.
 6 | - Natural Language Instructions: Executes tasks based on natural language commands.
 7 | - Persistent Session Management: Maintains browser sessions for continuous interaction.
 8 | ### Example Tasks
 9 | - Search for a product on Amazon.
10 | - Find the cheapest flight to Tokyo.
11 | - Purchase tickets for the next Warriors game.
12 | ### What's in this Project?
13 | - Environment setup instructions
14 | - Browser automation guides using Playwright
15 | - Structured prompting techniques for guiding the LLM in task execution
16 | - Content comprehension utilizing Llama 4 Scout
17 | - Creating a persistent and intelligent browser agent for real-world applications
18 | ### Demo
19 | For a detailed explanation and demo video, visit: [Blog Post and Demo Video](https://miguelg719.github.io/browser-use-blog/)
20 | ### Prerequisite for Running the Notebook
21 | - Before getting started, please make sure to setup Together.ai and get an API key from [here](https://www.together.ai/). 
22 | ### Collaborators
23 | Feel free to reach out with any questions or feedback!
24 | - Miguel Gonzalez: [X](https://x.com/miguel_gonzf) | [LinkedIn](https://www.linkedin.com/in/gonzalezfernandezmiguel/)
25 | - Dimitry Khorzov: [X](https://x.com/korzhov_dm) | [LinkedIn](https://www.linkedin.com/in/korzhovdm)
26 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/browser_use/agent/sample_screenshot.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/browser_use/agent/sample_screenshot.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/coding/text2sql/csv2db.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import sqlite3
 5 | import csv
 6 | 
 7 | # Define the input CSV file and the SQLite database file
 8 | input_csv = 'nba_roster.csv'
 9 | database_file = 'nba_roster.db'
10 | 
11 | # Connect to the SQLite database
12 | conn = sqlite3.connect(database_file)
13 | cursor = conn.cursor()
14 | 
15 | # Create a table to store the data
16 | cursor.execute('''CREATE TABLE IF NOT EXISTS nba_roster (
17 |                     Team TEXT,
18 |                     NAME TEXT,
19 |                     Jersey TEXT,
20 |                     POS TEXT,
21 |                     AGE INT,
22 |                     HT TEXT,
23 |                     WT TEXT,
24 |                     COLLEGE TEXT,
25 |                     SALARY TEXT
26 |                 )''')
27 | 
28 | # Read data from the CSV file and insert it into the SQLite table
29 | with open(input_csv, 'r', newline='') as csvfile:
30 |     csv_reader = csv.reader(csvfile)
31 |     next(csv_reader)  # Skip the header row
32 |     
33 |     for row in csv_reader:
34 |         cursor.execute('INSERT INTO nba_roster VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)', row)
35 | 
36 | # Commit the changes and close the database connection
37 | conn.commit()
38 | conn.close()
39 | 
40 | print(f'Data from {input_csv} has been successfully imported into {database_file}')
41 | 
42 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/coding/text2sql/nba_roster.db:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/coding/text2sql/nba_roster.db


--------------------------------------------------------------------------------
/end-to-end-use-cases/coding/text2sql/requirements.txt:
--------------------------------------------------------------------------------
1 | langchain
2 | langchain-community
3 | langchain-together


--------------------------------------------------------------------------------
/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/data/Llama Getting Started Guide.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/data/Llama Getting Started Guide.pdf


--------------------------------------------------------------------------------
/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/requirements.txt:
--------------------------------------------------------------------------------
1 | gradio
2 | pypdf
3 | langchain
4 | sentence-transformers
5 | faiss-cpu
6 | text-generation


--------------------------------------------------------------------------------
/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/vectorstore/db_faiss/index.faiss:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/vectorstore/db_faiss/index.faiss


--------------------------------------------------------------------------------
/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/vectorstore/db_faiss/index.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/customerservice_chatbots/RAG_chatbot/vectorstore/db_faiss/index.pkl


--------------------------------------------------------------------------------
/end-to-end-use-cases/customerservice_chatbots/messenger_chatbot/llama_messenger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 3 Community License Agreement.
 3 | 
 4 | import langchain
 5 | from langchain.llms import Replicate
 6 | 
 7 | from flask import Flask
 8 | from flask import request
 9 | import os
10 | import requests
11 | import json
12 | 
13 | os.environ["REPLICATE_API_TOKEN"] = "<your replicate api token>"
14 | llama3_8b_chat = "meta/meta-llama-3-8b-instruct"
15 | 
16 | llm = Replicate(
17 |     model=llama3_8b_chat,
18 |     model_kwargs={"temperature": 0.0, "top_p": 1, "max_new_tokens":500}
19 | )
20 | 
21 | app = Flask(__name__)
22 | 
23 | @app.route('/msgrcvd_pager', methods=['POST', 'GET'])
24 | def msgrcvd_pager():    
25 |     message = request.args.get('message')
26 |     sender = request.args.get('sender')
27 |     recipient = request.args.get('recipient')
28 | 
29 |     answer = llm(message)
30 |     print(message)
31 |     print(answer)
32 | 
33 |     url = f"https://graph.facebook.com/v18.0/{recipient}/messages"
34 |     params = {
35 |         'recipient': '{"id": ' + sender + '}',
36 |         'message': json.dumps({'text': answer}),
37 |         'messaging_type': 'RESPONSE',
38 |         'access_token': "<your page access token>"
39 |     }
40 |     headers = {
41 |         'Content-Type': 'application/json'
42 |     }
43 |     response = requests.post(url, params=params, headers=headers)
44 |     print(response.status_code)
45 |     print(response.text)
46 | 
47 |     return message + "<p/>" + answer
48 | 
49 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/email_agent/1.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/email_agent/2.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/email_agent/3.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/email_agent.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/email_agent/email_agent.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/main.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | import email_agent
 3 | from email_agent import *
 4 | from functions_prompt import system_prompt
 5 | 
 6 | 
 7 | def main():
 8 |     parser = argparse.ArgumentParser(description="Set email address")
 9 |     parser.add_argument("--email", type=str, required=True, help="Your Gmail address")
10 |     args = parser.parse_args()
11 | 
12 |     email_agent.set_email_service(args.email)
13 | 
14 |     greeting = llama31("hello", "Your name is Email Agent, an assistant that can perform all email related tasks for your user.")
15 |     agent_response = f"{greeting}\n\nYour ask: "
16 |     agent = Agent(system_prompt)
17 | 
18 |     while True:
19 |         ask = input(agent_response)
20 |         if ask == "bye":
21 |             print(llama31("bye"))
22 |             break
23 |         print("\n-------------------------\nCalling Llama...")
24 |         agent(ask)
25 |         agent_response = "Your ask: "
26 | 
27 | 
28 | if __name__ == "__main__":
29 |     main()
30 | 
31 | 
32 | 
33 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/email_agent/requirements.txt:
--------------------------------------------------------------------------------
1 | 
2 | google-auth==2.27.0
3 | google-auth-oauthlib==0.4.6
4 | google-auth-httplib2==0.1.0
5 | google-api-python-client==2.34.0
6 | pytz
7 | beautifulsoup4
8 | ollama
9 | pypdf


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/overview.csv:
--------------------------------------------------------------------------------
1 | repo_name,start_date,end_date,issues_created,open_discussion,closed_discussion,open_no_discussion,closed_no_discussion,open_questions,executive_summary,sentiment_count_negative,sentiment_count_neutral,sentiment_count_positive,severity_count_major,severity_count_minor,severity_count_critical,op_expertise_count_advanced,op_expertise_count_intermediate,themes_count_model_loading,themes_count_model_fine_tuning_and_training,themes_count_model_inference,themes_count_distributed_training_and_multi_gpu,themes_count_performance_and_optimization,themes_count_quantization_and_mixed_precision,themes_count_documentation,themes_count_cuda_compatibility,themes_count_model_evaluation_and_benchmarking,themes_count_miscellaneous
2 | pytorch/pytorch,2024-08-28,2024-08-28,26,8,0,18,0,"['What is the root cause of the performance regression in AMP static shape default wrapper with multiple threads on CPU?', 'How can we improve the naming and commenting scheme for triton fusion ops with custom triton kernel?', 'What is the impact of the security vulnerabilities in the protobuf version used by PyTorch?']","The PyTorch repository is facing various challenges, including performance regressions, compatibility issues, and security vulnerabilities. These issues are affecting different aspects of the project, such as tensor parallelism, autograd, and CUDA support. To address these challenges, the team needs to prioritize and tackle the root causes, which include missing optimized ops, incompatible backend combinations, and insufficient testing coverage.",17,7,2,21,4,1,21,5,3,3,3,3,5,1,1,2,1,14
3 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/commits.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/commits.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/engagement_sankey.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/engagement_sankey.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/expertise.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/expertise.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/sentiment.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/sentiment.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/severity.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/severity.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/themes.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/plots/themes.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/report.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/github_triage/output/pytorch/pytorch/2024-08-28_2024-08-28/report.pdf


--------------------------------------------------------------------------------
/end-to-end-use-cases/github_triage/requirements.txt:
--------------------------------------------------------------------------------
1 | kaleido
2 | plotly
3 | openai
4 | groq
5 | fpdf
6 | plotly
7 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/long_context/H2O/requirements.txt:
--------------------------------------------------------------------------------
1 | transformers
2 | rouge
3 | xopen
4 | needlehaystack


--------------------------------------------------------------------------------
/end-to-end-use-cases/long_context/H2O/src/streaming.sh:
--------------------------------------------------------------------------------
 1 | method=$1
 2 | if [[ ${method} == 'h2o' ]]; then
 3 |     python -u run_streaming.py \
 4 |         --input-path data \
 5 |         --model-name lmsys/vicuna-13b-v1.5 \
 6 |         --enable_h2o_generation \
 7 |         --num_heavy_hitter_tokens 2048 \
 8 |         --num_window_length 4096 \
 9 |         --enable_position_rolling
10 | elif [[ ${method} == 'full' ]]; then
11 |     python -u run_streaming.py \
12 |         --input-path data \
13 |         --model-name lmsys/vicuna-13b-v1.5
14 | else
15 |     echo 'unknown argument for method'
16 | fi
17 | 
18 | 
19 | 
20 | 
21 | 
22 | 
23 | 
24 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/img/phase1_eval_loss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/multilingual/img/phase1_eval_loss.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/img/phase1_train_loss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/multilingual/img/phase1_train_loss.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/img/phase2_eval_loss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/multilingual/img/phase2_eval_loss.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/img/phase2_train_loss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/end-to-end-use-cases/multilingual/img/phase2_train_loss.png


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/prepare_data.py:
--------------------------------------------------------------------------------
 1 | import fire
 2 | import os
 3 | from datasets import load_dataset
 4 | 
 5 | DATASET = "rahular/varta"
 6 | 
 7 | def main(split="validation", lang="hi", docs_to_sample=10_000, save_path="data"):
 8 |     dataset = load_dataset(DATASET, split=split, streaming=True)
 9 |     os.makedirs(save_path, exist_ok=True)
10 |     with open(os.path.join(save_path, f"{lang}.txt"), "w") as f:
11 |         count = 0
12 |         for idx, d in enumerate(dataset):
13 |             if idx % 10_000 == 0:
14 |                 print(f"Searched {idx} documents for {lang} documents. Found {count} documents.")
15 |             if count >= docs_to_sample:
16 |                 break
17 |             if d["langCode"] == lang:
18 |                 f.write(d["headline"] + "\n" + d["text"] + "\n")
19 |                 count += 1
20 | 
21 | 
22 | if __name__ == "__main__":
23 |     fire.Fire(main)


--------------------------------------------------------------------------------
/end-to-end-use-cases/multilingual/train_tokenizer.py:
--------------------------------------------------------------------------------
 1 | import fire
 2 | import os
 3 | import sentencepiece as spm
 4 | 
 5 | def main(data_file, save_path, vocab_size=16_000, num_threads=8):
 6 |     os.makedirs(save_path, exist_ok=True)
 7 |     tokenizer_name = os.path.join(save_path, "tokenizer")
 8 |     
 9 |     spm.SentencePieceTrainer.train(
10 |         input=data_file,
11 |         model_prefix=tokenizer_name,
12 |         vocab_size=vocab_size,
13 |         num_threads=num_threads,
14 |         model_type="bpe",
15 |         max_sentence_length=1073741824,
16 |         shuffle_input_sentence="true",
17 |         character_coverage=1.0,
18 |         hard_vocab_limit="false",
19 |     )
20 | 
21 | if __name__ == "__main__":
22 |     fire.Fire(main)
23 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/research_paper_analyzer/README.md:
--------------------------------------------------------------------------------
 1 | # Research Paper analyzer with Llama4 Maverick
 2 | 
 3 | This leverages **Llama 4 Maverick** model to retrieve the references of an arXiv paper and ingest all their content for question-answering without using any RAG to store these information.
 4 | 
 5 | ## Features
 6 | 
 7 | ### Leverage Long Context Length
 8 | | Model | Meta Llama4 Maverick | Meta Llama4 Scout | OpenAI GPT-4.5 | Claude Sonnet 3.7 |
 9 | | ----- | -------------- | -------------- | -------------- | -------------- |
10 | | Context Window | 1M tokens | 10M tokens | 128K tokens | 1K tokens | 200K tokens |
11 | 
12 | Because of the long context length, the analyzer can process all the reference paper content at once, so you can ask questions about the paper without worrying about the context length.
13 | 
14 | 
15 | ## Getting Started
16 | 
17 | 1. Install dependencies:
18 | 
19 | ```
20 | pip install -r requirements.txt
21 | ```
22 | 
23 | 2. Run the application:
24 | 
25 | ```
26 | python research_analyzer.py
27 | ```
28 | 
29 | 3. Open the gradio interface on localhost in the browser. 
30 | 
31 | 3. Provide a paper url such as https://arxiv.org/abs/2305.11135
32 | 
33 | 4. Press "Ingest", wait for paper to be processed and ask questions about it
34 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/research_paper_analyzer/requirements.txt:
--------------------------------------------------------------------------------
1 | gradio
2 | together
3 | requests
4 | pypdf2
5 | gradio
6 | 


--------------------------------------------------------------------------------
/end-to-end-use-cases/whatsapp_llama_4_bot/.env:
--------------------------------------------------------------------------------
 1 | # WhatsApp Business Phone Number ID (NOT the phone number itself)
 2 | PHONE_NUMBER_ID="place your whatsapp phone number id"
 3 | 
 4 | # Full URL to send WhatsApp messages (use correct version and phone number ID)
 5 | WHATSAPP_API_URL="place graphql request i.e. https://graph.facebook.com/v{version}/{phone_number_id}/messages"
 6 | 
 7 | # Your custom backend/agent endpoint (e.g., for LLM-based processing)
 8 | AGENT_URL=https://your-agent-url.com/api
 9 | 
10 | LLAMA_API_KEY="place your LLAMA API Key"
11 | 
12 | TOGETHER_API_KEY="place your Together API Key, In case you want to use Together, instead of Llama APIs"
13 | 
14 | GROQ_API_KEY="place your Groq API Key - this is for SST and TTS"
15 | 
16 | OPENAI_API_KEY="place your OpenAI Ke to run the client"
17 | 
18 | META_ACCESS_TOKEN="please your WhatsApp generated Access token from the app"


--------------------------------------------------------------------------------
/end-to-end-use-cases/whatsapp_llama_4_bot/ec2_endpoints.py:
--------------------------------------------------------------------------------
 1 | from fastapi import FastAPI, HTTPException 
 2 | from fastapi.responses import FileResponse
 3 | from pydantic import BaseModel
 4 | from typing import Optional
 5 | from service import text_to_speech, get_llm_response, handle_image_message,handle_audio_message,send_audio_message
 6 | from enum import Enum
 7 | app = FastAPI()
 8 | 
 9 | class TextToSpeechRequest(BaseModel):
10 |     text: str
11 |     output_path: Optional[str] = "reply.mp3"
12 | 
13 | class TextToSpeechResponse(BaseModel):
14 |     file_path: Optional[str]
15 |     error: Optional[str] = None
16 | 
17 | class KindEnum(str, Enum):
18 |     audio = "audio"
19 |     image = "image"
20 | 
21 | class LLMRequest(BaseModel):
22 |     user_input: str
23 |     media_id: Optional[str] = None
24 |     kind: Optional[KindEnum] = None
25 | 
26 | 
27 | class LLMResponse(BaseModel):
28 |     response: Optional[str]
29 |     error: Optional[str] = None
30 | 
31 | @app.post("/llm-response", response_model=LLMResponse)
32 | async def api_llm_response(req: LLMRequest):
33 |     text_message = req.user_input
34 |     image_base64 = None
35 |     if req.kind == KindEnum.image:
36 |         image_base64 = await handle_image_message(req.media_id)
37 |         result = get_llm_response(text_message, image_input=image_base64)
38 |         # print(result)
39 |     elif req.kind == KindEnum.audio:
40 |         text_message = await handle_audio_message(req.media_id)
41 |         result = get_llm_response(text_message)
42 |         audio_path = text_to_speech(text=result, output_path="reply.mp3")
43 |         return FileResponse(audio_path, media_type="audio/mpeg", filename="reply.mp3")
44 |     else:
45 |         result = get_llm_response(text_message)
46 |     
47 |     if result is None:
48 |         return LLMResponse(response=None, error="LLM response generation failed.")
49 |     return LLMResponse(response=result)


--------------------------------------------------------------------------------
/end-to-end-use-cases/whatsapp_llama_4_bot/requirements.txt:
--------------------------------------------------------------------------------
 1 | aiohappyeyeballs==2.6.1
 2 | aiohttp==3.11.16
 3 | aiosignal==1.3.2
 4 | annotated-types==0.7.0
 5 | anyio==4.9.0
 6 | async-timeout==5.0.1
 7 | attrs==25.3.0
 8 | certifi==2025.1.31
 9 | charset-normalizer==3.4.1
10 | click==8.1.8
11 | colorama==0.4.6
12 | distro==1.9.0
13 | dotenv==0.9.9
14 | eval_type_backport==0.2.2
15 | exceptiongroup==1.2.2
16 | fastapi==0.115.12
17 | filelock==3.18.0
18 | frozenlist==1.5.0
19 | groq==0.22.0
20 | h11==0.14.0
21 | httpcore==1.0.8
22 | httpx==0.28.1
23 | idna==3.10
24 | markdown-it-py==3.0.0
25 | mdurl==0.1.2
26 | multidict==6.4.3
27 | numpy==2.2.4
28 | pillow==11.2.1
29 | propcache==0.3.1
30 | pyarrow==19.0.1
31 | pydantic==2.11.3
32 | pydantic_core==2.33.1
33 | Pygments==2.19.1
34 | python-dotenv==1.1.0
35 | requests==2.32.3
36 | rich==13.9.4
37 | shellingham==1.5.4
38 | sniffio==1.3.1
39 | starlette==0.46.2
40 | tabulate==0.9.0
41 | together==1.5.5
42 | tqdm==4.67.1
43 | typer==0.15.2
44 | typing-inspection==0.4.0
45 | typing_extensions==4.13.2
46 | urllib3==2.4.0
47 | uvicorn==0.34.1
48 | yarl==1.19.0


--------------------------------------------------------------------------------
/getting-started/finetuning/finetuning.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | import fire
5 | from llama_cookbook.finetuning import main
6 | 
7 | if __name__ == "__main__":
8 |     fire.Fire(main)


--------------------------------------------------------------------------------
/getting-started/finetuning/multi_node.slurm:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3.
 3 | 
 4 | 
 5 | #!/bin/bash
 6 | 
 7 | #SBATCH --job-name=Nano-2d-trainer-20b-8nodes
 8 | 
 9 | #SBATCH --ntasks=2
10 | #SBATCH --nodes=2
11 | #SBATCH --gpus-per-task=4
12 | #SBATCH --partition=train 
13 | nodes=( $( scontrol show hostnames $SLURM_JOB_NODELIST ) )
14 | nodes_array=($nodes)
15 | head_node=${nodes_array[0]}
16 | head_node_ip=$(srun --nodes=1 --ntasks=1 -w "$head_node" hostname --ip-address)
17 | # Enable for A100
18 | export FI_PROVIDER="efa"
19 | 
20 | echo Node IP: $head_node_ip
21 | export LOGLEVEL=INFO
22 | # debugging flags (optional)
23 | export NCCL_DEBUG=WARN
24 | export NCCL_DEBUG_SUBSYS=WARN
25 | export PYTHONFAULTHANDLER=1
26 | export LD_LIBRARY_PATH=/opt/amazon/efa/lib:$LD_LIBRARY_PATH
27 | export LD_LIBRARY_PATH=/usr/local/lib/:$LD_LIBRARY_PATH
28 | export CUDA_LAUNCH_BLOCKING=0
29 | 
30 | # on your cluster you might need these:
31 | # set the network interface
32 | export NCCL_SOCKET_IFNAME="ens"
33 | export FI_EFA_USE_DEVICE_RDMA=1
34 | 
35 | srun  torchrun --nproc_per_node 4 --rdzv_id $RANDOM --rdzv_backend c10d --rdzv_endpoint $head_node_ip:29500 ./finetuning.py  --enable_fsdp --use_peft --peft_method lora
36 | 
37 | 


--------------------------------------------------------------------------------
/getting-started/inference/README.md:
--------------------------------------------------------------------------------
1 | ## Quickstart > Inference
2 | 
3 | This folder contains scripts to get you started with inference on Meta Llama models.
4 | 
5 | * [Local Inference](./local_inference/) contains scripts to do memory efficient inference on servers and local machines
6 | 


--------------------------------------------------------------------------------
/getting-started/inference/local_inference/samsum_prompt.txt:
--------------------------------------------------------------------------------
 1 | Summarize this dialog:
 2 | A: Hi Tom, are you busy tomorrow’s afternoon?
 3 | B: I’m pretty sure I am. What’s up?
 4 | A: Can you go with me to the animal shelter?.
 5 | B: What do you want to do?
 6 | A: I want to get a puppy for my son.
 7 | B: That will make him so happy.
 8 | A: Yeah, we’ve discussed it many times. I think he’s ready now.
 9 | B: That’s good. Raising a dog is a tough issue. Like having a baby ;-) 
10 | A: I'll get him one of those little dogs.
11 | B: One that won't grow up too big;-)
12 | A: And eat too much;-))
13 | B: Do you know which one he would like?
14 | A: Oh, yes, I took him there last Monday. He showed me one that he really liked.
15 | B: I bet you had to drag him away.
16 | A: He wanted to take it home right away ;-).
17 | B: I wonder what he'll name it.
18 | A: He said he’d name it after his dead hamster – Lemmy  - he's  a great Motorhead fan :-)))
19 | ---
20 | Summary:


--------------------------------------------------------------------------------
/getting-started/responsible_ai/README.md:
--------------------------------------------------------------------------------
 1 | # Trust and Safety with Llama
 2 | 
 3 | The [Purple Llama](https://github.com/meta-llama/PurpleLlama/) project provides tools and models to improve LLM security. This folder contains examples to get started with PurpleLlama tools.
 4 | 
 5 | | Tool/Model | Description | Get Started
 6 | |---|---|---|
 7 | [Llama Guard](https://llama.meta.com/docs/model-cards-and-prompt-formats/llama-guard-3) | Provide guardrailing on inputs and outputs | [Inference](./llama_guard/llama_guard_text_and_vision_inference.ipynb), [Finetuning](./llama_guard/llama_guard_customization_via_prompting_and_fine_tuning.ipynb)
 8 | [Prompt Guard](https://llama.meta.com/docs/model-cards-and-prompt-formats/prompt-guard) | Model to safeguards against jailbreak attempts and embedded prompt injections | [Notebook](./prompt_guard/prompt_guard_tutorial.ipynb)
 9 | [Code Shield](https://github.com/meta-llama/PurpleLlama/tree/main/CodeShield) | Tool to safeguard against insecure code generated by the LLM | [Notebook](https://github.com/meta-llama/PurpleLlama/blob/main/CodeShield/notebook/CodeShieldUsageDemo.ipynb)
10 | 
11 | 
12 | 
13 | 


--------------------------------------------------------------------------------
/getting-started/responsible_ai/llama_guard/README.md:
--------------------------------------------------------------------------------
 1 | # Meta Llama Guard demo
 2 | <!-- markdown-link-check-disable -->
 3 | Meta Llama Guard is a language model that provides input and output guardrails for LLM inference. For more details and model cards, please visit the [PurpleLlama](https://github.com/meta-llama/PurpleLlama) repository.
 4 | 
 5 | This [notebook](llama_guard_text_and_vision_inference.ipynb) shows how to load the models with the transformers library and how to customize the categories.
 6 | 
 7 | ## Requirements
 8 | 1. Access to Llama guard model weights on Hugging Face. To get access, follow the steps described in the top of the model card in [Hugging Face](https://huggingface.co/meta-llama/Llama-Guard-3-1B)
 9 | 2. Llama recipes package and its dependencies [installed](https://github.com/meta-llama/llama-cookbook?tab=readme-ov-file#installing)
10 | 3. Pillow package installed
11 | 
12 | ## Inference Safety Checker
13 | When running the regular inference script with prompts, Meta Llama Guard will be used as a safety checker on the user prompt and the model output. If both are safe, the result will be shown, else a message with the error will be shown, with the word unsafe and a comma separated list of categories infringed. Meta Llama Guard is always loaded quantized using Hugging Face Transformers library with bitsandbytes.
14 | 
15 | In this case, the default categories are applied by the tokenizer, using the `apply_chat_template` method.
16 | 
17 | Use this command for testing with a quantized Llama model, modifying the values accordingly:
18 | 
19 | `python inference.py --model_name <path_to_regular_llama_model> --prompt_file <path_to_prompt_file> --enable_llamaguard_content_safety`
20 | 
21 | ## Llama Guard 3 Finetuning & Customization
22 | The safety categories in Llama Guard 3 can be tuned for specific application needs. Existing categories can be removed and new categories can be added to the taxonomy. The [Llama Guard Customization](./llama_guard_customization_via_prompting_and_fine_tuning.ipynb) notebook walks through the process.


--------------------------------------------------------------------------------
/getting-started/responsible_ai/llama_guard/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | 


--------------------------------------------------------------------------------
/getting-started/responsible_ai/llama_guard/resources/dog.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/getting-started/responsible_ai/llama_guard/resources/dog.jpg


--------------------------------------------------------------------------------
/getting-started/responsible_ai/llama_guard/resources/pasta.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/getting-started/responsible_ai/llama_guard/resources/pasta.jpeg


--------------------------------------------------------------------------------
/getting-started/responsible_ai/prompt_guard/README.md:
--------------------------------------------------------------------------------
 1 | # Prompt Guard demo
 2 | <!-- markdown-link-check-disable -->
 3 | Prompt Guard is a classifier model that provides input guardrails for LLM inference, particularly against *prompt attacks. For more details and model cards, please visit the main repository, [Meta Prompt Guard](https://github.com/meta-llama/PurpleLlama/tree/main/Prompt-Guard)
 4 | 
 5 | This folder contains an example file to run inference with a locally hosted model, either using the Hugging Face Hub or a local path. It also contains a comprehensive demo demonstrating the scenarios in which the model is effective and a script for fine-tuning the model.
 6 | 
 7 | This is a very small model and inference and fine-tuning are feasible on local CPUs.
 8 | 
 9 | ## Requirements
10 | 1. Access to Prompt Guard model weights on Hugging Face. To get access, follow the steps described [here](https://github.com/facebookresearch/PurpleLlama/tree/main/Prompt-Guard#download)
11 | 2. Llama recipes package and it's dependencies [installed](https://github.com/meta-llama/llama-cookbook?tab=readme-ov-file#installing)
12 | 


--------------------------------------------------------------------------------
/getting-started/responsible_ai/prompt_guard/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/getting-started/responsible_ai/prompt_guard/__init__.py


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [build-system]
 2 | requires = ["hatchling", "hatch-requirements-txt"]
 3 | build-backend = "hatchling.build"
 4 | 
 5 | [project]
 6 | name = "llama-cookbook"
 7 | version = "0.0.5.post1"
 8 | authors = [
 9 |   { name="Hamid Shojanazeri", email="hamidnazeri@meta.com" },
10 |   { name="Matthias Reso", email="mreso@meta.com" },
11 |   { name="Geeta Chauhan", email="gchauhan@meta.com" },
12 | ]
13 | description = "Llama-cookbook is a companion project to the Llama models. It's goal is to provide examples to quickly get started with fine-tuning for domain adaptation and how to run inference for the fine-tuned models."
14 | readme = "README.md"
15 | requires-python = ">=3.8"
16 | classifiers = [
17 |     "Programming Language :: Python :: 3",
18 |     "License :: Other/Proprietary License",
19 |     "Operating System :: OS Independent",
20 | ]
21 | dynamic = ["dependencies"]
22 | 
23 | [project.optional-dependencies]
24 | vllm = ["vllm"]
25 | tests = ["pytest-mock"]
26 | auditnlg = ["auditnlg"]
27 | langchain = ["langchain_openai", "langchain", "langchain_community"]
28 | 
29 | [project.urls]
30 | "Homepage" = "https://github.com/meta-llama/llama-cookbook"
31 | "Bug Tracker" = "https://github.com/meta-llama/llama-cookbook/issues"
32 | 
33 | [tool.hatch.build]
34 | exclude = [
35 |   "dist/*",
36 | ]
37 | 
38 | [tool.hatch.build.targets.wheel]
39 | packages = ["src/llama_cookbook"]
40 | 
41 | [tool.hatch.metadata.hooks.requirements_txt]
42 | files = ["requirements.txt"]
43 | 
44 | [tool.pytest.ini_options]
45 | markers = [
46 |     "skip_missing_tokenizer: skip tests when we can not access meta-llama/Llama-2-7b-hf on huggingface hub (Log in with `huggingface-cli login` to unskip).",
47 | ]
48 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | torch>=2.2
 2 | accelerate
 3 | appdirs
 4 | loralib
 5 | bitsandbytes
 6 | black
 7 | black[jupyter]
 8 | datasets
 9 | fire
10 | peft
11 | transformers>=4.45.1
12 | sentencepiece
13 | py7zr
14 | scipy
15 | optimum
16 | matplotlib
17 | chardet
18 | openai
19 | typing-extensions>=4.8.0
20 | tabulate
21 | evaluate
22 | rouge_score
23 | pyyaml==6.0.1
24 | faiss-gpu; python_version < '3.11'
25 | unstructured[pdf]
26 | sentence_transformers
27 | codeshield
28 | gradio
29 | markupsafe==2.0.1
30 | 


--------------------------------------------------------------------------------
/src/docs/img/WhatApp_Llama4_integration.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/WhatApp_Llama4_integration.jpeg


--------------------------------------------------------------------------------
/src/docs/img/a_colorful_llama_doing_ai_programming.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/a_colorful_llama_doing_ai_programming.jpeg


--------------------------------------------------------------------------------
/src/docs/img/a_llama_dressed_as_a_professional_mountain.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/a_llama_dressed_as_a_professional_mountain.jpeg


--------------------------------------------------------------------------------
/src/docs/img/cat.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/cat.jpeg


--------------------------------------------------------------------------------
/src/docs/img/feature_based_fn.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/feature_based_fn.png


--------------------------------------------------------------------------------
/src/docs/img/feature_based_fn_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/feature_based_fn_2.png


--------------------------------------------------------------------------------
/src/docs/img/full_param_fn.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/full_param_fn.png


--------------------------------------------------------------------------------
/src/docs/img/gnocchi_alla_romana.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/gnocchi_alla_romana.jpeg


--------------------------------------------------------------------------------
/src/docs/img/grocery_shopping_bascket_with_salmon_in_package.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/grocery_shopping_bascket_with_salmon_in_package.jpeg


--------------------------------------------------------------------------------
/src/docs/img/k1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k1.jpg


--------------------------------------------------------------------------------
/src/docs/img/k1_resized.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k1_resized.jpg


--------------------------------------------------------------------------------
/src/docs/img/k2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k2.jpg


--------------------------------------------------------------------------------
/src/docs/img/k2_resized.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k2_resized.jpg


--------------------------------------------------------------------------------
/src/docs/img/k3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k3.jpg


--------------------------------------------------------------------------------
/src/docs/img/k3_resized.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k3_resized.jpg


--------------------------------------------------------------------------------
/src/docs/img/k4.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k4.jpg


--------------------------------------------------------------------------------
/src/docs/img/k4_resized.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/k4_resized.jpg


--------------------------------------------------------------------------------
/src/docs/img/llama-mobile-confirmed.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama-mobile-confirmed.png


--------------------------------------------------------------------------------
/src/docs/img/llama-recipes.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama-recipes.png


--------------------------------------------------------------------------------
/src/docs/img/llama2_gradio.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama2_gradio.png


--------------------------------------------------------------------------------
/src/docs/img/llama2_streamlit.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama2_streamlit.png


--------------------------------------------------------------------------------
/src/docs/img/llama2_streamlit2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama2_streamlit2.png


--------------------------------------------------------------------------------
/src/docs/img/llama_stack.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/llama_stack.png


--------------------------------------------------------------------------------
/src/docs/img/messenger_api_settings.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/messenger_api_settings.png


--------------------------------------------------------------------------------
/src/docs/img/messenger_llama_arch.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/messenger_llama_arch.jpg


--------------------------------------------------------------------------------
/src/docs/img/meta_release.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/meta_release.png


--------------------------------------------------------------------------------
/src/docs/img/resized_image.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/resized_image.jpg


--------------------------------------------------------------------------------
/src/docs/img/thumbnail_IMG_1329.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/thumbnail_IMG_1329.jpg


--------------------------------------------------------------------------------
/src/docs/img/thumbnail_IMG_1440.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/thumbnail_IMG_1440.jpg


--------------------------------------------------------------------------------
/src/docs/img/thumbnail_IMG_6385.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/thumbnail_IMG_6385.jpg


--------------------------------------------------------------------------------
/src/docs/img/wandb_screenshot.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/wandb_screenshot.png


--------------------------------------------------------------------------------
/src/docs/img/whatsapp_dashboard.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/whatsapp_dashboard.jpg


--------------------------------------------------------------------------------
/src/docs/img/whatsapp_llama_arch.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/meta-llama/llama-cookbook/0f4e671f2ccb794b6017391d10a87f0f2af8a2c9/src/docs/img/whatsapp_llama_arch.jpg


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | from llama_cookbook.configs.peft import lora_config, llama_adapter_config, prefix_config
5 | from llama_cookbook.configs.fsdp import fsdp_config
6 | from llama_cookbook.configs.training import train_config
7 | from llama_cookbook.configs.wandb import wandb_config
8 | from llama_cookbook.configs.quantization import quantization_config
9 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/datasets.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from dataclasses import dataclass
 5 | 
 6 | 
 7 | @dataclass
 8 | class samsum_dataset:
 9 |     dataset: str =  "samsum_dataset"
10 |     train_split: str = "train"
11 |     test_split: str = "validation"
12 | 
13 | 
14 | @dataclass
15 | class grammar_dataset:
16 |     dataset: str = "grammar_dataset"
17 |     train_split: str = "src/llama_cookbook/datasets/grammar_dataset/gtrain_10k.csv"
18 |     test_split: str = "src/llama_cookbook/datasets/grammar_dataset/grammar_validation.csv"
19 | 
20 | 
21 | @dataclass
22 | class alpaca_dataset:
23 |     dataset: str = "alpaca_dataset"
24 |     train_split: str = "train"
25 |     test_split: str = "val"
26 |     data_path: str = "src/llama_cookbook/datasets/alpaca_data.json"
27 | 
28 | @dataclass
29 | class custom_dataset:
30 |     dataset: str = "custom_dataset"
31 |     file: str = "getting-started/finetuning/datasets/custom_dataset.py"
32 |     train_split: str = "train"
33 |     test_split: str = "validation"
34 |     data_path: str = ""
35 | 
36 | @dataclass
37 | class llamaguard_toxicchat_dataset:
38 |     dataset: str = "llamaguard_toxicchat_dataset"
39 |     train_split: str = "train"
40 |     test_split: str = "test"
41 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/fsdp.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from dataclasses import dataclass
 5 | 
 6 | from torch.distributed.fsdp import ShardingStrategy
 7 | from torch.distributed.fsdp.fully_sharded_data_parallel import StateDictType
 8 | 
 9 | @dataclass
10 | class fsdp_config:
11 |     mixed_precision: bool=True
12 |     use_fp16: bool=False # use fp16 for all fsdp.MixedPrecision dtypes (param, reduce, buffer, see https://pytorch.org/docs/stable/fsdp.html#torch.distributed.fsdp.MixedPrecision)
13 |     sharding_strategy: ShardingStrategy = ShardingStrategy.FULL_SHARD # HYBRID_SHARD "Full Shard within a node DDP cross Nodes", SHARD_GRAD_OP "Shard only Gradients and Optimizer States", NO_SHARD "Similar to DDP".
14 |     hsdp : bool =False # Require HYBRID_SHARD to be set. This flag can extend the HYBRID_SHARD by allowing sharding a model on customized number of GPUs (Sharding_group) and Replicas over Sharding_group.
15 |     sharding_group_size : int=0 # requires hsdp to be set. This specifies the sharding group size, number of GPUs that you model can fit into to form a replica of a model.
16 |     replica_group_size: int=0 #requires hsdp to be set. This specifies the replica group size, which is world_size/sharding_group_size.
17 |     checkpoint_type: StateDictType = StateDictType.SHARDED_STATE_DICT  # alternatively FULL_STATE_DICT can be used. SHARDED_STATE_DICT saves one file with sharded weights per rank while FULL_STATE_DICT will collect all weights on rank 0 and save them in a single file.
18 |     fsdp_activation_checkpointing: bool=True
19 |     fsdp_cpu_offload: bool=False
20 |     pure_bf16: bool = False  # disables mixed precision, and runs in pure bfloat16
21 |     optimizer: str= "AdamW"
22 |     
23 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/peft.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from dataclasses import dataclass, field
 5 | from typing import List
 6 | 
 7 | @dataclass
 8 | class lora_config:
 9 |      r: int=8
10 |      lora_alpha: int=32
11 |      target_modules: List[str] = field(default_factory=lambda: ["q_proj", "v_proj"])
12 |      bias= "none"
13 |      task_type: str= "CAUSAL_LM"
14 |      lora_dropout: float=0.05
15 |      inference_mode: bool = False
16 | 
17 | @dataclass
18 | class llama_adapter_config:
19 |      adapter_len: int= 10
20 |      adapter_layers: int= 30
21 |      task_type: str= "CAUSAL_LM"
22 | 
23 | #CAUTION prefix tuning is currently not supported
24 | @dataclass
25 | class prefix_config:
26 |      num_virtual_tokens: int=30
27 |      task_type: str= "CAUSAL_LM"
28 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/quantization.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from dataclasses import dataclass
 5 | from typing import Optional
 6 | import torch
 7 | from transformers import BitsAndBytesConfig
 8 | 
 9 | @dataclass
10 | class quantization_config:
11 |     quant_type: str =  "fp4" # "fp4" or "nf4"
12 |     compute_dtype: torch.dtype = torch.bfloat16
13 |     use_double_quant: bool = False
14 |     quant_storage: torch.dtype = torch.bfloat16
15 | 
16 |     def create_bnb_config(self, quantization: str) -> BitsAndBytesConfig:
17 |         if quantization not in {"4bit", "8bit"}:
18 |             raise ValueError("quantization must be either '4bit' or '8bit'")
19 | 
20 |         if quantization == "4bit":
21 |             config_params = {
22 |                 "bnb_4bit_quant_type": self.quant_type,
23 |                 "bnb_4bit_compute_dtype": self.compute_dtype,
24 |                 "bnb_4bit_use_double_quant": self.use_double_quant,
25 |                 "bnb_4bit_quant_storage": self.quant_storage,
26 |             }
27 |             
28 |             return BitsAndBytesConfig(load_in_4bit=True, **config_params)
29 |         else:
30 |             return BitsAndBytesConfig(load_in_8bit=True)
31 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/configs/wandb.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from typing import List, Optional
 5 | from dataclasses import dataclass, field
 6 | 
 7 | @dataclass
 8 | class wandb_config:
 9 |     project: str = 'llama_cookbook' # wandb project name
10 |     entity: Optional[str] = None # wandb entity name
11 |     job_type: Optional[str] = None
12 |     tags: Optional[List[str]] = None
13 |     group: Optional[str] = None
14 |     notes: Optional[str] = None
15 |     mode: Optional[str] = None
16 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/data/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.


--------------------------------------------------------------------------------
/src/llama_cookbook/data/concatenator.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from tqdm import tqdm
 5 | from itertools import chain
 6 | 
 7 | from torch.utils.data import Dataset
 8 | 
 9 | 
10 | class ConcatDataset(Dataset):
11 |     def __init__(self, dataset, chunk_size=4096):
12 |         self.dataset = dataset
13 |         self.chunk_size = chunk_size
14 | 
15 |         self.samples = []
16 | 
17 |         buffer = {
18 |             "input_ids": [],
19 |             "attention_mask": [],
20 |             "labels": [],
21 |             }
22 | 
23 |         for sample in tqdm(self.dataset, desc="Preprocessing dataset", dynamic_ncols=True):
24 |             buffer = {k: v + sample[k] for k,v in buffer.items()}
25 | 
26 |             while len(next(iter(buffer.values()))) > self.chunk_size:
27 |                 self.samples.append({k: v[:self.chunk_size] for k,v in buffer.items()})
28 |                 buffer = {k: v[self.chunk_size:] for k,v in buffer.items()}
29 | 
30 |     def __getitem__(self, idx):
31 |         return self.samples[idx]
32 | 
33 |     def __len__(self):
34 |         return len(self.samples)
35 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/data/llama_guard/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama Guard License Agreement.


--------------------------------------------------------------------------------
/src/llama_cookbook/datasets/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from functools import partial
 5 | 
 6 | from llama_cookbook.datasets.grammar_dataset.grammar_dataset import get_dataset as get_grammar_dataset
 7 | from llama_cookbook.datasets.alpaca_dataset import InstructionDataset as get_alpaca_dataset
 8 | from llama_cookbook.datasets.custom_dataset import get_custom_dataset,get_data_collator
 9 | from llama_cookbook.datasets.samsum_dataset import get_preprocessed_samsum as get_samsum_dataset
10 | from llama_cookbook.datasets.toxicchat_dataset import get_llamaguard_toxicchat_dataset as get_llamaguard_toxicchat_dataset
11 | DATASET_PREPROC = {
12 |     "alpaca_dataset": partial(get_alpaca_dataset),
13 |     "grammar_dataset": get_grammar_dataset,
14 |     "samsum_dataset": get_samsum_dataset,
15 |     "custom_dataset": get_custom_dataset,
16 |     "llamaguard_toxicchat_dataset": get_llamaguard_toxicchat_dataset,
17 | }
18 | DATALOADER_COLLATE_FUNC = {
19 |     "custom_dataset": get_data_collator
20 | }
21 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/datasets/grammar_dataset/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/datasets/samsum_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | # For dataset details visit: https://huggingface.co/datasets/samsum
 5 | 
 6 | import copy
 7 | import datasets
 8 | 
 9 | from unittest.mock import patch
10 | 
11 | @patch('builtins.input', return_value="N")
12 | def load_samsum(split, _):
13 |     try:
14 |         ds = datasets.load_dataset("knkarthick/samsum", split=split)
15 |     except ValueError as e:
16 |         if "trust_remote_code" in str(e):
17 |           raise ValueError("Loading knkarthick/samsum requires you to execute the dataset script in that repo on your local machine. Make sure you have read the code there to avoid malicious use, then set HF_DATASETS_TRUST_REMOTE_CODE env variable to True.") from e
18 |         else:
19 |           raise e
20 |     return ds
21 | 
22 | 
23 | def get_preprocessed_samsum(dataset_config, tokenizer, split):
24 |     dataset = load_samsum(split)
25 | 
26 |     prompt = (
27 |         f"Summarize this dialog:\n{{dialog}}\n---\nSummary:\n"
28 |     )
29 | 
30 |     def apply_prompt_template(sample):
31 |         return {
32 |             "prompt": prompt.format(dialog=sample["dialogue"]),
33 |             "summary": sample["summary"],
34 |         }
35 | 
36 |     dataset = dataset.map(apply_prompt_template, remove_columns=list(dataset.features))
37 | 
38 |     def tokenize_add_label(sample):
39 |         prompt = tokenizer.encode(tokenizer.bos_token + sample["prompt"], add_special_tokens=False)
40 |         summary = tokenizer.encode(sample["summary"] +  tokenizer.eos_token, add_special_tokens=False)
41 | 
42 |         sample = {
43 |             "input_ids": prompt + summary,
44 |             "attention_mask" : [1] * (len(prompt) + len(summary)),
45 |             "labels": [-100] * len(prompt) + summary,
46 |             }
47 | 
48 |         return sample
49 | 
50 |     dataset = dataset.map(tokenize_add_label, remove_columns=list(dataset.features))
51 | 
52 |     return dataset
53 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/inference/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.


--------------------------------------------------------------------------------
/src/llama_cookbook/inference/chat_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import json
 5 | 
 6 | def read_dialogs_from_file(file_path):
 7 |     with open(file_path, 'r') as file:
 8 |         dialogs = json.load(file)
 9 |     return dialogs
10 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/model_checkpointing/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from llama_cookbook.model_checkpointing.checkpoint_handler import (
 5 |     load_model_checkpoint,
 6 |     save_fsdp_model_checkpoint_full,
 7 |     save_peft_checkpoint,
 8 |     save_model_checkpoint,
 9 |     load_optimizer_checkpoint,
10 |     save_optimizer_checkpoint,
11 |     save_model_and_optimizer_sharded,
12 |     load_model_sharded,
13 |     load_sharded_model_single_gpu
14 | )
15 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/policies/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | from llama_cookbook.policies.mixed_precision import *
5 | from llama_cookbook.policies.wrapping import *
6 | from llama_cookbook.policies.activation_checkpointing_functions import apply_fsdp_checkpointing
7 | from llama_cookbook.policies.anyprecision_optimizer import AnyPrecisionAdamW
8 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/policies/activation_checkpointing_functions.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from functools import partial
 5 | 
 6 | from torch.distributed.algorithms._checkpoint.checkpoint_wrapper import (
 7 |     checkpoint_wrapper,
 8 |     CheckpointImpl,
 9 |     apply_activation_checkpointing,
10 | )
11 | from transformers.models.llama.modeling_llama import LlamaDecoderLayer
12 | 
13 | non_reentrant_wrapper = partial(
14 |     checkpoint_wrapper,
15 |     checkpoint_impl=CheckpointImpl.NO_REENTRANT,
16 | )
17 | 
18 | check_fn = lambda submodule: isinstance(submodule, LlamaDecoderLayer)
19 | 
20 | 
21 | def apply_fsdp_checkpointing(model):
22 |     """apply activation checkpointing to model
23 |     returns None as model is updated directly
24 |     """
25 |     print(f"--> applying fsdp activation checkpointing...")
26 | 
27 |     apply_activation_checkpointing(
28 |         model, checkpoint_wrapper_fn=non_reentrant_wrapper, check_fn=check_fn
29 |     )
30 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/policies/mixed_precision.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import torch
 5 | 
 6 | from torch.distributed.fsdp import (
 7 |     MixedPrecision,
 8 | )
 9 | 
10 | # requires grad scaler in main loop
11 | fpSixteen = MixedPrecision(
12 |     param_dtype=torch.float16,
13 |     # Gradient communication precision.
14 |     reduce_dtype=torch.float16,
15 |     # Buffer precision.
16 |     buffer_dtype=torch.float16,
17 | )
18 | 
19 | bfSixteen = MixedPrecision(
20 |     param_dtype=torch.bfloat16,
21 |     # Gradient communication precision.
22 |     reduce_dtype=torch.bfloat16,
23 |     # Buffer precision.
24 |     buffer_dtype=torch.bfloat16,
25 |     cast_forward_inputs=True,
26 | )
27 | 
28 | bfSixteen_mixed = MixedPrecision(
29 |     param_dtype=torch.float32,
30 |     reduce_dtype=torch.bfloat16,
31 |     buffer_dtype=torch.bfloat16,
32 | )
33 | 
34 | fp32_policy = MixedPrecision(
35 |     param_dtype=torch.float32,
36 |     reduce_dtype=torch.float32,
37 |     buffer_dtype=torch.float32,
38 | )
39 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/policies/wrapping.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import functools
 5 | 
 6 | from transformers.models.llama.modeling_llama import LlamaDecoderLayer
 7 | from transformers.models.mllama.modeling_mllama import   MllamaSelfAttentionDecoderLayer,MllamaCrossAttentionDecoderLayer,MllamaVisionEncoderLayer
 8 | 
 9 | from torch.distributed.fsdp.wrap import (
10 |     transformer_auto_wrap_policy,
11 |     size_based_auto_wrap_policy,
12 | )
13 | 
14 | 
15 | def get_size_policy(min_params=1e8):
16 |     num_wrap_policy = functools.partial(
17 |         size_based_auto_wrap_policy, min_num_params=min_params
18 |     )
19 |     return num_wrap_policy
20 | 
21 | 
22 | def get_llama_wrapper():
23 |     """we register our main layer class and use the fsdp transformer wrapping policy
24 |     ensures embedding layers are in the root fsdp unit for shared access and that fsdp units map to transformer layers
25 |     """
26 |     # ====   use new transformer wrapper
27 | 
28 |     llama_auto_wrap_policy = functools.partial(
29 |         transformer_auto_wrap_policy,
30 |         transformer_layer_cls=set([LlamaDecoderLayer, MllamaSelfAttentionDecoderLayer,MllamaVisionEncoderLayer,MllamaCrossAttentionDecoderLayer])
31 |     )
32 | 
33 |     return llama_auto_wrap_policy
34 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/tools/README.md:
--------------------------------------------------------------------------------
 1 | # Convert Hugging Face llama weights to official llama consolidated format
 2 | 
 3 | This is the reverse conversion for `convert_llama_weights_to_hf.py` script from the transformer package.
 4 | 
 5 | ## Step 0: Convert to consolidated format
 6 | - Create an output directory for the converted weights, such as `test70B`.
 7 | - Copy file params.json from the official llama download into that directory.
 8 | - Run the conversion script. `model-path` can be a Hugging Face hub model or a local hf model directory.
 9 | ```
10 | python -m llama_cookbook.tools.convert_hf_weights_to_llama --model-path meta-llama/Meta-Llama-3.1-70B-Instruct --output-dir test70B --model-size 70B
11 | ```
12 | 
13 | ## Step 1: Run inference
14 | Checkout the official llama 3 inference [repo](https://github.com/meta-llama/llama3). Test using chat or text completion.
15 | ```
16 | torchrun --nproc_per_node 8 example_chat_completion.py --ckpt_dir ./test70B --tokenizer_path ${llama_3_dir}/tokenizer.model
17 | ```
18 | 
19 | For validation, please compare the converted weights with official llama 2 weights
20 | ```
21 | python compare_llama_weights.py test70B ${Llama-3-70B-Instruct_dir}
22 | ```
23 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/tools/compare_llama_weights.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | import gc
 5 | import glob
 6 | import os
 7 | import sys
 8 | 
 9 | import torch
10 | import tqdm
11 | 
12 | 
13 | def main() -> None:
14 |     """Compare two llama checkpoint directories"""
15 | 
16 |     one_files = sorted(glob.glob(os.path.join(sys.argv[1], "consolidated.*.pth")))
17 |     two_files = sorted(glob.glob(os.path.join(sys.argv[2], "consolidated.*.pth")))
18 |     assert len(one_files) == len(
19 |         two_files
20 |     ), "One directory has {} files while another has {} files.".format(
21 |         len(one_files), len(two_files)
22 |     )
23 | 
24 |     deltas = []
25 |     for i in tqdm.trange(len(one_files), desc="Comparing shards"):
26 |         one = torch.load(one_files[i])
27 |         two = torch.load(two_files[i])
28 |         assert len(one) == len(
29 |             two
30 |         ), "shard should have the same length: {} != {}".format(len(one), len(two))
31 |         one = sorted(one.items(), key=lambda x: x[0])
32 |         two = sorted(two.items(), key=lambda x: x[0])
33 | 
34 |         for _, (v, w) in enumerate(zip(one, two)):
35 |             assert v[0] == w[0], "{} != {}".format(v[0], w[0])
36 |             assert v[1].shape == w[1].shape, "tensor {} shape {} != {}".format(
37 |                 v[0], v[1].shape, w[1].shape
38 |             )
39 | 
40 |             delta = (v[1] - w[1]).abs().max().item()
41 |             deltas.append((i, v[0], delta, w[1].abs().mean().item()))
42 |         del one
43 |         del two
44 |         gc.collect()
45 | 
46 |     deltas = sorted(deltas, key=lambda x: x[-2], reverse=True)
47 |     print("Top 10 largest deltas:")
48 |     for i, k, delta, value in deltas[:10]:
49 |         print(f"  shard {i} {k}: {delta} vs {value}")
50 | 
51 | 
52 | if __name__ == "__main__":
53 |     main()
54 | 


--------------------------------------------------------------------------------
/src/llama_cookbook/utils/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
3 | 
4 | from llama_cookbook.utils.memory_utils import MemoryTrace
5 | from llama_cookbook.utils.dataset_utils import *
6 | from llama_cookbook.utils.fsdp_utils import fsdp_auto_wrap_policy, hsdp_device_mesh, get_policies
7 | from llama_cookbook.utils.train_utils import *


--------------------------------------------------------------------------------
/src/tests/utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Meta Platforms, Inc. and affiliates.
 2 | # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
 3 | 
 4 | from transformers import AutoTokenizer
 5 | 
 6 | 
 7 | class FakeTokenizer(object):
 8 |     def __init__(self):
 9 |         self.pad_token_id = 0
10 |         self.bos_token_id = 42
11 |         self.eos_token_id = 43
12 |         self.sep_token_id = 3
13 |         self.vocab_size = 128256
14 | 
15 |         self.pad_token = "<|pad_id|>"
16 |         self.bos_token = "<|bos_id|>"
17 |         self.eos_token = "<|eos_id|>"
18 |         self.sep_token = "<|sep_id|>"
19 |         self.tokenizer = self
20 |         self.padding_side = "left"
21 | 
22 |     def __call__(self, *args, **kwargs):
23 |         ids = self.encode(*args, **kwargs)
24 |         return {"input_ids": ids}
25 | 
26 |     def encode(self, text, *args, **kwargs):
27 |         return [self.bos_token_id] + [len(c) for c in text.split(" ")] + [self.eos_token_id]
28 |     
29 |     def __len__(self):
30 |         return 128256
31 |     
32 |     def pad(self, *args, **kwargs):
33 |         args = args[0]
34 |         max_len = max([len(a["input_ids"]) for a in args])
35 |         for a in args:
36 |             for k in a.keys():
37 |                 a[k] = a[k] + ([self.pad_token_id if k == "input_ids" else 0] * (max_len - len(a)))
38 |         out = {}
39 |         for k in args[0].keys():
40 |             out[k] = [a[k] for a in args]
41 |         return out
42 | 
43 | 
44 | def maybe_tokenizer(name):
45 |     if name == "fake_llama":
46 |         return FakeTokenizer()
47 |     try:
48 |         return AutoTokenizer.from_pretrained(name)
49 |     except OSError:
50 |         return None
51 | 


--------------------------------------------------------------------------------