├── README.md ├── assets └── figure.png ├── configs ├── default_prompts │ ├── ag_news.j2 │ ├── anli.j2 │ ├── boolq.j2 │ ├── cosmos_qa.j2 │ ├── hellaswag.j2 │ ├── imdb.j2 │ ├── nq_open.j2 │ ├── trivia_qa.j2 │ └── tweet_emotion.j2 └── metric │ ├── few_shot_accuracy_defaults.yaml │ ├── permutational_sensitivity_defaults.yaml │ ├── perturbational_accuracy_defaults.yaml │ ├── selectional_sensitivity_defaults.yaml │ └── zero_shot_accuracy_defaults.yaml ├── data ├── __init__.py ├── ag_news.py ├── anli.py ├── boolq.py ├── cosmos_qa.py ├── dataset.py ├── hellaswag.py ├── imdb.py ├── nq_open.py ├── trivia_qa.py └── tweet_emotion.py ├── decoders ├── __init__.py ├── constrained_label_generation.py ├── constrained_per_example_label_generation.py ├── decoder.py ├── greedy_generation.py └── nucleus_generation.py ├── evaluate_instruction.py ├── instructions ├── ape │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ ├── nq_open.yaml │ ├── trivia_qa.yaml │ └── tweet_emotion.yaml ├── chat_gpt_prompts │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ ├── nq_open.yaml │ ├── trivia_qa.yaml │ └── tweet_emotion.yaml ├── generic_instruction │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ ├── nq_open.yaml │ ├── trivia_qa.yaml │ └── tweet_emotion.yaml ├── low_perplexity_prompts │ ├── bloom1b1 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── bloom1b7 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── bloom3b │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── bloom7b1 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── gptneo1b3 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── gptneo2b7 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── gptneox20b │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── llama13b │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── llama7b │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── opt13b │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── opt1b3 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ ├── opt2b7 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml │ └── opt6b7 │ │ ├── ag_news.yaml │ │ ├── anli.yaml │ │ ├── boolq.yaml │ │ ├── cosmos_qa.yaml │ │ ├── hellaswag.yaml │ │ ├── imdb.yaml │ │ ├── nq_open.yaml │ │ ├── trivia_qa.yaml │ │ └── tweet_emotion.yaml ├── manual │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ ├── nq_open.yaml │ ├── trivia_qa.yaml │ └── tweet_emotion.yaml ├── no_instruction │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ ├── nq_open.yaml │ ├── trivia_qa.yaml │ └── tweet_emotion.yaml └── rlprompt │ ├── ag_news.yaml │ ├── anli.yaml │ ├── boolq.yaml │ ├── cosmos_qa.yaml │ ├── hellaswag.yaml │ ├── imdb.yaml │ └── tweet_emotion.yaml ├── metrics ├── __init__.py ├── few_shot_accuracy.py ├── metric.py ├── permutational_sensitivity.py ├── perturbational_accuracy.py ├── selectional_sensitivity.py ├── utils.py └── zero_shot_accuracy.py ├── models ├── __init__.py ├── base.py ├── bloom1b1.py ├── bloom1b7.py ├── bloom3b.py ├── bloom7b1.py ├── causal_lm.py ├── gptneo1b3.py ├── gptneo2b7.py ├── gptneox20b.py ├── llama13b.py ├── llama7b.py ├── masked_lm.py ├── opt13b.py ├── opt1b3.py ├── opt2b7.py ├── opt6b7.py ├── stablelmbase3b.py ├── stablelmbase7b.py ├── stablelmtuned3b.py └── stablelmtuned7b.py ├── notebooks └── aggregate_results.ipynb ├── requirements.txt ├── templates ├── __init__.py ├── few_shot_template.py └── instruction_based_fs_template.py └── utils.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/README.md -------------------------------------------------------------------------------- /assets/figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/assets/figure.png -------------------------------------------------------------------------------- /configs/default_prompts/ag_news.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/ag_news.j2 -------------------------------------------------------------------------------- /configs/default_prompts/anli.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/anli.j2 -------------------------------------------------------------------------------- /configs/default_prompts/boolq.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/boolq.j2 -------------------------------------------------------------------------------- /configs/default_prompts/cosmos_qa.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/cosmos_qa.j2 -------------------------------------------------------------------------------- /configs/default_prompts/hellaswag.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/hellaswag.j2 -------------------------------------------------------------------------------- /configs/default_prompts/imdb.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/imdb.j2 -------------------------------------------------------------------------------- /configs/default_prompts/nq_open.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/nq_open.j2 -------------------------------------------------------------------------------- /configs/default_prompts/trivia_qa.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/trivia_qa.j2 -------------------------------------------------------------------------------- /configs/default_prompts/tweet_emotion.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/default_prompts/tweet_emotion.j2 -------------------------------------------------------------------------------- /configs/metric/few_shot_accuracy_defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/metric/few_shot_accuracy_defaults.yaml -------------------------------------------------------------------------------- /configs/metric/permutational_sensitivity_defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/metric/permutational_sensitivity_defaults.yaml -------------------------------------------------------------------------------- /configs/metric/perturbational_accuracy_defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/metric/perturbational_accuracy_defaults.yaml -------------------------------------------------------------------------------- /configs/metric/selectional_sensitivity_defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/configs/metric/selectional_sensitivity_defaults.yaml -------------------------------------------------------------------------------- /configs/metric/zero_shot_accuracy_defaults.yaml: -------------------------------------------------------------------------------- 1 | zero_shot_accuracy: 2 | num_test_instances: 100 -------------------------------------------------------------------------------- /data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/__init__.py -------------------------------------------------------------------------------- /data/ag_news.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/ag_news.py -------------------------------------------------------------------------------- /data/anli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/anli.py -------------------------------------------------------------------------------- /data/boolq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/boolq.py -------------------------------------------------------------------------------- /data/cosmos_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/cosmos_qa.py -------------------------------------------------------------------------------- /data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/dataset.py -------------------------------------------------------------------------------- /data/hellaswag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/hellaswag.py -------------------------------------------------------------------------------- /data/imdb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/imdb.py -------------------------------------------------------------------------------- /data/nq_open.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/nq_open.py -------------------------------------------------------------------------------- /data/trivia_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/trivia_qa.py -------------------------------------------------------------------------------- /data/tweet_emotion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/data/tweet_emotion.py -------------------------------------------------------------------------------- /decoders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/__init__.py -------------------------------------------------------------------------------- /decoders/constrained_label_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/constrained_label_generation.py -------------------------------------------------------------------------------- /decoders/constrained_per_example_label_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/constrained_per_example_label_generation.py -------------------------------------------------------------------------------- /decoders/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/decoder.py -------------------------------------------------------------------------------- /decoders/greedy_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/greedy_generation.py -------------------------------------------------------------------------------- /decoders/nucleus_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/decoders/nucleus_generation.py -------------------------------------------------------------------------------- /evaluate_instruction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/evaluate_instruction.py -------------------------------------------------------------------------------- /instructions/ape/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/ag_news.yaml -------------------------------------------------------------------------------- /instructions/ape/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/anli.yaml -------------------------------------------------------------------------------- /instructions/ape/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/boolq.yaml -------------------------------------------------------------------------------- /instructions/ape/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/ape/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/ape/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/imdb.yaml -------------------------------------------------------------------------------- /instructions/ape/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/nq_open.yaml -------------------------------------------------------------------------------- /instructions/ape/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/ape/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/ape/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/ag_news.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/anli.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/boolq.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/imdb.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/nq_open.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/chat_gpt_prompts/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/chat_gpt_prompts/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/ag_news.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/anli.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/boolq.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/imdb.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/nq_open.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/generic_instruction/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/generic_instruction/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b1/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b1/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom1b7/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom1b7/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom3b/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom3b/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/bloom7b1/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/bloom7b1/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo1b3/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo1b3/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneo2b7/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneo2b7/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/gptneox20b/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/gptneox20b/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama13b/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama13b/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/llama7b/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/llama7b/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt13b/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt13b/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt1b3/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt1b3/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt2b7/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt2b7/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/ag_news.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/anli.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/boolq.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/imdb.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/nq_open.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/low_perplexity_prompts/opt6b7/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/low_perplexity_prompts/opt6b7/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/manual/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/ag_news.yaml -------------------------------------------------------------------------------- /instructions/manual/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/anli.yaml -------------------------------------------------------------------------------- /instructions/manual/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/boolq.yaml -------------------------------------------------------------------------------- /instructions/manual/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/manual/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/manual/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/imdb.yaml -------------------------------------------------------------------------------- /instructions/manual/nq_open.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/nq_open.yaml -------------------------------------------------------------------------------- /instructions/manual/trivia_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/trivia_qa.yaml -------------------------------------------------------------------------------- /instructions/manual/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/manual/tweet_emotion.yaml -------------------------------------------------------------------------------- /instructions/no_instruction/ag_news.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/anli.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/boolq.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/cosmos_qa.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/hellaswag.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/imdb.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/nq_open.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/trivia_qa.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/no_instruction/tweet_emotion.yaml: -------------------------------------------------------------------------------- 1 | - "" -------------------------------------------------------------------------------- /instructions/rlprompt/ag_news.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/ag_news.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/anli.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/anli.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/boolq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/boolq.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/cosmos_qa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/cosmos_qa.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/hellaswag.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/hellaswag.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/imdb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/imdb.yaml -------------------------------------------------------------------------------- /instructions/rlprompt/tweet_emotion.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/instructions/rlprompt/tweet_emotion.yaml -------------------------------------------------------------------------------- /metrics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/__init__.py -------------------------------------------------------------------------------- /metrics/few_shot_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/few_shot_accuracy.py -------------------------------------------------------------------------------- /metrics/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/metric.py -------------------------------------------------------------------------------- /metrics/permutational_sensitivity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/permutational_sensitivity.py -------------------------------------------------------------------------------- /metrics/perturbational_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/perturbational_accuracy.py -------------------------------------------------------------------------------- /metrics/selectional_sensitivity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/selectional_sensitivity.py -------------------------------------------------------------------------------- /metrics/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/utils.py -------------------------------------------------------------------------------- /metrics/zero_shot_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/metrics/zero_shot_accuracy.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/base.py -------------------------------------------------------------------------------- /models/bloom1b1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/bloom1b1.py -------------------------------------------------------------------------------- /models/bloom1b7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/bloom1b7.py -------------------------------------------------------------------------------- /models/bloom3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/bloom3b.py -------------------------------------------------------------------------------- /models/bloom7b1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/bloom7b1.py -------------------------------------------------------------------------------- /models/causal_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/causal_lm.py -------------------------------------------------------------------------------- /models/gptneo1b3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/gptneo1b3.py -------------------------------------------------------------------------------- /models/gptneo2b7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/gptneo2b7.py -------------------------------------------------------------------------------- /models/gptneox20b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/gptneox20b.py -------------------------------------------------------------------------------- /models/llama13b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/llama13b.py -------------------------------------------------------------------------------- /models/llama7b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/llama7b.py -------------------------------------------------------------------------------- /models/masked_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/masked_lm.py -------------------------------------------------------------------------------- /models/opt13b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/opt13b.py -------------------------------------------------------------------------------- /models/opt1b3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/opt1b3.py -------------------------------------------------------------------------------- /models/opt2b7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/opt2b7.py -------------------------------------------------------------------------------- /models/opt6b7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/opt6b7.py -------------------------------------------------------------------------------- /models/stablelmbase3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/stablelmbase3b.py -------------------------------------------------------------------------------- /models/stablelmbase7b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/stablelmbase7b.py -------------------------------------------------------------------------------- /models/stablelmtuned3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/stablelmtuned3b.py -------------------------------------------------------------------------------- /models/stablelmtuned7b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/models/stablelmtuned7b.py -------------------------------------------------------------------------------- /notebooks/aggregate_results.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/notebooks/aggregate_results.ipynb -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/requirements.txt -------------------------------------------------------------------------------- /templates/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/templates/__init__.py -------------------------------------------------------------------------------- /templates/few_shot_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/templates/few_shot_template.py -------------------------------------------------------------------------------- /templates/instruction_based_fs_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/templates/instruction_based_fs_template.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/princeton-nlp/InstructEval/HEAD/utils.py --------------------------------------------------------------------------------