├── .codespell-ignore-words.txt ├── .gitignore ├── .pre-commit-config.yaml ├── LICENSE ├── README.md ├── assets ├── logo.png ├── logo_baai.png ├── logo_bupt.png └── logo_pku.png ├── development.md ├── eval_anything ├── Arial.ttf ├── __init__.py ├── __main__.py ├── benchmarks │ ├── __init__.py │ ├── benchmark.md │ ├── cot_fewshot │ │ ├── agieval.csv │ │ ├── gsm8k_main.json │ │ └── mmlupro.json │ ├── fewshot │ │ └── truthfulqa.json │ ├── safedata │ │ ├── BeaverTails-Evaluation.json │ │ ├── CDialBias.csv │ │ ├── DecodingTrust.jsonl │ │ ├── Sexual_orientation.jsonl │ │ ├── confaide.json │ │ ├── harmful_behaviors.csv │ │ ├── mitre_prompts_multilingual_machine_translated.json │ │ ├── output.json │ │ ├── split_instructions.json │ │ ├── test.csv │ │ └── test.jsonl │ ├── text_audio_to_text │ │ └── mmau │ │ │ ├── configs.yaml │ │ │ └── eval.py │ ├── text_image_to_text │ │ ├── mathvision │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ └── mmmu │ │ │ ├── configs.yaml │ │ │ └── eval.py │ ├── text_to_text │ │ ├── AGIEval │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── tools.py │ │ ├── ARC │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── AdvBench │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── Anthropics │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── BBQ │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── BeaverTails │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── CDialBias │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── CEval │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── CMMLU │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── Cona │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── Confaide │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── CyberAttackAssistance │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── DeceptionBench │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── DecodingTrust │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── Dice │ │ │ └── eval.py │ │ ├── DoAnythingNow │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── DoNotAnswer │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── FakeAlignment │ │ │ ├── LLM_utils.py │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ ├── prompts.py │ │ │ └── safety.jsonl │ │ ├── Flames │ │ │ ├── Flames_1k_Chinese.jsonl │ │ │ ├── configs.yaml │ │ │ ├── configuration_internlm.py │ │ │ ├── eval.py │ │ │ ├── infer.py │ │ │ ├── modeling_internlm.py │ │ │ ├── tokenization_internlm.py │ │ │ └── utils.py │ │ ├── HExPHI │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── HarmBench │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── HarmfulQ │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── HumanEval │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── metrics.py │ │ ├── LatentJailbreak │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── MIC │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── MMLUPRO │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── MaliciousInstruct │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── MaliciousInstructions │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── MoralBench │ │ │ ├── README.md │ │ │ ├── answers │ │ │ │ ├── 6_concepts.json │ │ │ │ ├── 6_concepts_compare.json │ │ │ │ ├── MFQ_30.json │ │ │ │ └── MFQ_30_compare.json │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ ├── main.py │ │ │ ├── questions │ │ │ │ ├── 6_concepts │ │ │ │ │ ├── authority_1.txt │ │ │ │ │ ├── authority_2.txt │ │ │ │ │ ├── authority_3.txt │ │ │ │ │ ├── authority_4.txt │ │ │ │ │ ├── fairness_1.txt │ │ │ │ │ ├── fairness_2.txt │ │ │ │ │ ├── fairness_3.txt │ │ │ │ │ ├── fairness_4.txt │ │ │ │ │ ├── harm_1.txt │ │ │ │ │ ├── harm_2.txt │ │ │ │ │ ├── harm_3.txt │ │ │ │ │ ├── harm_4.txt │ │ │ │ │ ├── ingroup_1.txt │ │ │ │ │ ├── ingroup_2.txt │ │ │ │ │ ├── ingroup_3.txt │ │ │ │ │ ├── ingroup_4.txt │ │ │ │ │ ├── liberty_1.txt │ │ │ │ │ ├── liberty_2.txt │ │ │ │ │ ├── liberty_3.txt │ │ │ │ │ ├── liberty_4.txt │ │ │ │ │ ├── purity_1.txt │ │ │ │ │ ├── purity_2.txt │ │ │ │ │ ├── purity_3.txt │ │ │ │ │ └── purity_4.txt │ │ │ │ ├── 6_concepts_compare │ │ │ │ │ ├── authority_1.txt │ │ │ │ │ ├── authority_2.txt │ │ │ │ │ ├── authority_3.txt │ │ │ │ │ ├── authority_4.txt │ │ │ │ │ ├── fairness_1.txt │ │ │ │ │ ├── fairness_2.txt │ │ │ │ │ ├── fairness_3.txt │ │ │ │ │ ├── fairness_4.txt │ │ │ │ │ ├── harm_1.txt │ │ │ │ │ ├── harm_2.txt │ │ │ │ │ ├── harm_3.txt │ │ │ │ │ ├── harm_4.txt │ │ │ │ │ ├── ingroup_1.txt │ │ │ │ │ ├── ingroup_2.txt │ │ │ │ │ ├── ingroup_3.txt │ │ │ │ │ ├── ingroup_4.txt │ │ │ │ │ ├── liberty_1.txt │ │ │ │ │ ├── liberty_2.txt │ │ │ │ │ ├── liberty_3.txt │ │ │ │ │ ├── liberty_4.txt │ │ │ │ │ ├── purity_1.txt │ │ │ │ │ ├── purity_2.txt │ │ │ │ │ ├── purity_3.txt │ │ │ │ │ └── purity_4.txt │ │ │ │ ├── MFQ_30 │ │ │ │ │ ├── authority_1.txt │ │ │ │ │ ├── authority_2.txt │ │ │ │ │ ├── authority_3.txt │ │ │ │ │ ├── authority_4.txt │ │ │ │ │ ├── fairness_1.txt │ │ │ │ │ ├── fairness_2.txt │ │ │ │ │ ├── fairness_3.txt │ │ │ │ │ ├── fairness_4.txt │ │ │ │ │ ├── harm_1.txt │ │ │ │ │ ├── harm_2.txt │ │ │ │ │ ├── harm_3.txt │ │ │ │ │ ├── harm_4.txt │ │ │ │ │ ├── ingroup_1.txt │ │ │ │ │ ├── ingroup_2.txt │ │ │ │ │ ├── ingroup_3.txt │ │ │ │ │ ├── ingroup_4.txt │ │ │ │ │ ├── purity_1.txt │ │ │ │ │ ├── purity_2.txt │ │ │ │ │ ├── purity_3.txt │ │ │ │ │ └── purity_4.txt │ │ │ │ └── MFQ_30_compare │ │ │ │ │ ├── authority_1.txt │ │ │ │ │ ├── authority_2.txt │ │ │ │ │ ├── authority_3.txt │ │ │ │ │ ├── authority_4.txt │ │ │ │ │ ├── fairness_1.txt │ │ │ │ │ ├── fairness_2.txt │ │ │ │ │ ├── fairness_3.txt │ │ │ │ │ ├── fairness_4.txt │ │ │ │ │ ├── harm_1.txt │ │ │ │ │ ├── harm_2.txt │ │ │ │ │ ├── harm_3.txt │ │ │ │ │ ├── harm_4.txt │ │ │ │ │ ├── ingroup_1.txt │ │ │ │ │ ├── ingroup_2.txt │ │ │ │ │ ├── ingroup_3.txt │ │ │ │ │ ├── ingroup_4.txt │ │ │ │ │ ├── purity_1.txt │ │ │ │ │ ├── purity_2.txt │ │ │ │ │ ├── purity_3.txt │ │ │ │ │ └── purity_4.txt │ │ │ ├── template │ │ │ │ └── moral_system.txt │ │ │ └── utils.py │ │ ├── MoralChoice │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── RedEval │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── SandP │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── SimpleSafetyTests │ │ │ └── Strongreject │ │ │ │ ├── configs.yaml │ │ │ │ ├── eval.py │ │ │ │ └── utils.py │ │ ├── Strongreject │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── TDCRedTeaming │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── TruthfulQA │ │ │ ├── configs.yaml │ │ │ ├── dataloader.py │ │ │ ├── eval.py │ │ │ ├── metrics.py │ │ │ └── tools.py │ │ ├── XSTest │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── XSafety │ │ │ ├── Multilingual_safety_benchmark │ │ │ │ ├── LICENSE │ │ │ │ ├── README.md │ │ │ │ ├── ar │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── bn │ │ │ │ │ ├── Crimes_And_Illegal_Activities_n.xlsx │ │ │ │ │ ├── Ethics_And_Morality_n.xlsx │ │ │ │ │ ├── Goal_Hijacking_n.xlsx │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion_n.xlsx │ │ │ │ │ ├── Insult_n.xlsx │ │ │ │ │ ├── Mental_Health_n.xlsx │ │ │ │ │ ├── Physical_Harm_n.xlsx │ │ │ │ │ ├── Privacy_And_Property_n.xlsx │ │ │ │ │ ├── Prompt_Leaking_n.xlsx │ │ │ │ │ ├── Reverse_Exposure_n.xlsx │ │ │ │ │ ├── Role_Play_Instruction_n.xlsx │ │ │ │ │ ├── Unfairness_And_Discrimination_n.xlsx │ │ │ │ │ ├── Unsafe_Instruction_Topic_n.xlsx │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── de │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── en │ │ │ │ │ ├── Crimes_And_Illegal_Activities_en.csv │ │ │ │ │ ├── Ethics_And_Morality_n.csv │ │ │ │ │ ├── Goal_Hijacking_n.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion_n.csv │ │ │ │ │ ├── Insult_n.csv │ │ │ │ │ ├── Mental_Health_n.csv │ │ │ │ │ ├── Physical_Harm_n.csv │ │ │ │ │ ├── Privacy_And_Property_n.csv │ │ │ │ │ ├── Prompt_Leaking_n.csv │ │ │ │ │ ├── Reverse_Exposure_n.csv │ │ │ │ │ ├── Role_Play_Instruction_n.csv │ │ │ │ │ ├── Unfairness_And_Discrimination_n.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic_n.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── fr │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── hi │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ ├── commen_sense.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── ja │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── paper │ │ │ │ │ ├── Overview.png │ │ │ │ │ ├── framework.jpg │ │ │ │ │ ├── frameworks.pdf │ │ │ │ │ ├── result1.jpg │ │ │ │ │ └── result2.jpg │ │ │ │ ├── ru │ │ │ │ │ ├── Crimes_And_Illegal_Activitie.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ ├── sp │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ │ └── zh │ │ │ │ │ ├── Crimes_And_Illegal_Activities.csv │ │ │ │ │ ├── Ethics_And_Morality.csv │ │ │ │ │ ├── Goal_Hijacking.csv │ │ │ │ │ ├── Inquiry_With_Unsafe_Opinion.csv │ │ │ │ │ ├── Insult.csv │ │ │ │ │ ├── Mental_Health.csv │ │ │ │ │ ├── Physical_Harm.csv │ │ │ │ │ ├── Privacy_And_Property.csv │ │ │ │ │ ├── Prompt_Leaking.csv │ │ │ │ │ ├── Reverse_Exposure.csv │ │ │ │ │ ├── Role_Play_Instruction.csv │ │ │ │ │ ├── Unfairness_And_Discrimination.csv │ │ │ │ │ ├── Unsafe_Instruction_Topic.csv │ │ │ │ │ └── commonsense.csv │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── aegis_aicontent_safety_dataset │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── air_bench_2024 │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── gptfuzzer │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ ├── prompts.json │ │ │ └── utils.py │ │ ├── gsm8k │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── jade_db │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── jbb_behaviors │ │ │ ├── classifier.py │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── llm_jailbreak_study │ │ │ ├── configs.yaml │ │ │ ├── data.json │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── mmlu │ │ │ ├── configs.yaml │ │ │ └── eval.py │ │ ├── s_eval │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ └── utils.py │ │ └── salad_bench │ │ │ ├── configs.yaml │ │ │ ├── eval.py │ │ │ ├── evaluator.py │ │ │ ├── metrics.py │ │ │ ├── model_utils.py │ │ │ ├── template.py │ │ │ ├── text_utils.py │ │ │ └── utils.py │ ├── text_video_to_text │ │ └── mmvu │ │ │ ├── configs.yaml │ │ │ └── eval.py │ └── text_vision_to_action │ │ └── chores │ │ ├── configs.yaml │ │ └── eval.py ├── cli.py ├── configs │ ├── evaluate.yaml │ ├── evaluate_Confaide.yaml │ ├── evaluate_DecodingTrust.yaml │ ├── evaluate_DoNotAnswer.yaml │ ├── evaluate_FakeAlignment.yaml │ ├── evaluate_Flames.yaml │ ├── evaluate_HExPHI.yaml │ ├── evaluate_HarmBench.yaml │ ├── evaluate_HarmfulQ.yaml │ ├── evaluate_LatentJailbreak.yaml │ ├── evaluate_MaliciousInstruct.yaml │ ├── evaluate_MaliciousInstructions.yaml │ ├── evaluate_MoralBench.yaml │ ├── evaluate_RedEval.yaml │ ├── evaluate_XSafety.yaml │ ├── evaluate_aegis_aicontent_safety_dataset.yaml │ ├── evaluate_air_bench_2024.yaml │ ├── evaluate_deceptionbench.yaml │ ├── evaluate_gptfuzzer.yaml │ ├── evaluate_jade_db.yaml │ ├── evaluate_jbb_behaviors.yaml │ ├── evaluate_llm_jailbreak_study.yaml │ ├── evaluate_s_eval.yaml │ └── evaluate_salad_bench.yaml ├── dataloader │ ├── base_dataloader.py │ ├── format_mm_dataset.py │ ├── mm_dataloader.py │ ├── t2t_dataloader.py │ └── tv2act_dataloader.py ├── eval-anything-local │ ├── data │ │ ├── HarmfulQ.json │ │ ├── MaliciousInstruct.txt │ │ ├── MaliciousInstructions.json │ │ ├── harmbench_behaviors_text_all.csv │ │ └── latent_jailbreak_data.json │ └── jade_db_data │ │ ├── LICENSE │ │ ├── README.md │ │ ├── jade-db-v1.0 │ │ ├── jade_benchmark_en.csv │ │ └── jade_benchmark_zh.csv │ │ ├── jade-db-v2.0 │ │ ├── jade_benchmark_easy_zh.csv │ │ └── jade_benchmark_medium_zh.csv │ │ └── jade-db-v3.0 │ │ ├── README.md │ │ ├── jade_alignment_hard_zh.csv │ │ └── jade_alignment_medium_zh.csv ├── evaluate_tools │ ├── README.md │ ├── base_tools.py │ ├── cached_requests.py │ ├── metrics.py │ └── t2t_tools.py ├── license │ ├── add_license.py │ └── add_third_party.py ├── models │ ├── api_lm.py │ ├── base_model.py │ ├── hf_lm.py │ ├── hf_mm.py │ ├── hf_vla.py │ ├── vllm_lm.py │ └── vllm_mm.py ├── pipeline │ ├── base_benchmark.py │ ├── base_task.py │ ├── mm_gen_benchmark.py │ ├── mm_und_benchmark.py │ ├── t2t_benchmark.py │ └── tv2act_benchmark.py ├── third_party │ └── SPOC │ │ ├── environment │ │ ├── __init__.py │ │ ├── manipulation_sensors.py │ │ ├── navigation_sensors.py │ │ ├── spoc_objects.py │ │ ├── stretch_controller.py │ │ ├── stretch_state.py │ │ └── vision_sensors.py │ │ ├── spoc_model │ │ ├── __init__.py │ │ ├── agent.py │ │ ├── early_fusion_tsfm_models.py │ │ ├── preprocessors.py │ │ └── text_cond_visual_encoder.py │ │ ├── tasks │ │ ├── __init__.py │ │ ├── abstract_task.py │ │ ├── abstract_task_sampler.py │ │ ├── fetch_task.py │ │ ├── multi_task_eval_sampler.py │ │ ├── object_nav_task.py │ │ ├── pickup_task.py │ │ ├── room_nav_task.py │ │ ├── room_visit_task.py │ │ ├── safety_components.py │ │ └── task_specs.py │ │ └── utils │ │ ├── constants │ │ ├── __init__.py │ │ ├── objaverse_data_dirs.py │ │ ├── object_constants.py │ │ ├── stretch_initialization_utils.py │ │ └── template_verbs.py │ │ ├── data_generation_utils │ │ ├── __init__.py │ │ ├── mp4_utils.py │ │ └── navigation_utils.py │ │ ├── distance_calculation_utils.py │ │ ├── objaverse_annotation.py │ │ ├── online_evaluation_types_and_utils.py │ │ ├── reward_shaper.py │ │ ├── sel_utils.py │ │ ├── sensor_constant_utils.py │ │ ├── string_utils.py │ │ ├── synset_to_best_lemma.json │ │ ├── synset_utils.py │ │ ├── task_datagen_utils.py │ │ ├── task_spec_to_instruction.py │ │ ├── task_type_mapping_utils.py │ │ ├── transformation_util.py │ │ ├── type_utils.py │ │ └── visualization_utils.py ├── utils │ ├── cache_manager.py │ ├── cached_requests.py │ ├── data_type.py │ ├── logger.py │ ├── mm_data_manager.py │ ├── prompt_builders.py │ ├── register.py │ ├── template.py │ ├── utils.py │ └── uuid.py └── version.py ├── pyproject.toml ├── scripts ├── download_dataset.py ├── download_objaverse_houses.py ├── run.sh ├── run_Confaide.sh ├── run_DecodingTrust.sh ├── run_DoNotAnswer.sh ├── run_Flames.sh ├── run_HExPHI.sh ├── run_HarmBench.sh ├── run_LatentJailbreak.sh ├── run_MoralBench.sh ├── run_RedEval.sh ├── run_XSafety.sh ├── run_deceptionbench.sh ├── run_jade_db.sh └── run_vla.sh └── setup.py /.codespell-ignore-words.txt: -------------------------------------------------------------------------------- 1 | ans 2 | res 3 | ths 4 | buld 5 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/README.md -------------------------------------------------------------------------------- /assets/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/assets/logo.png -------------------------------------------------------------------------------- /assets/logo_baai.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/assets/logo_baai.png -------------------------------------------------------------------------------- /assets/logo_bupt.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/assets/logo_bupt.png -------------------------------------------------------------------------------- /assets/logo_pku.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/assets/logo_pku.png -------------------------------------------------------------------------------- /development.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/development.md -------------------------------------------------------------------------------- /eval_anything/Arial.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/Arial.ttf -------------------------------------------------------------------------------- /eval_anything/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /eval_anything/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/__main__.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/__init__.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/benchmark.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/benchmark.md -------------------------------------------------------------------------------- /eval_anything/benchmarks/cot_fewshot/agieval.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/cot_fewshot/agieval.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/cot_fewshot/gsm8k_main.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/cot_fewshot/gsm8k_main.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/cot_fewshot/mmlupro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/cot_fewshot/mmlupro.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/fewshot/truthfulqa.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/fewshot/truthfulqa.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/BeaverTails-Evaluation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/BeaverTails-Evaluation.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/CDialBias.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/CDialBias.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/DecodingTrust.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/DecodingTrust.jsonl -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/Sexual_orientation.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/Sexual_orientation.jsonl -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/confaide.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/confaide.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/harmful_behaviors.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/harmful_behaviors.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/mitre_prompts_multilingual_machine_translated.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/mitre_prompts_multilingual_machine_translated.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/output.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/output.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/split_instructions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/split_instructions.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/test.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/safedata/test.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/safedata/test.jsonl -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_audio_to_text/mmau/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_audio_to_text/mmau/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_audio_to_text/mmau/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_audio_to_text/mmau/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_image_to_text/mathvision/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_image_to_text/mathvision/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_image_to_text/mathvision/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_image_to_text/mathvision/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_image_to_text/mmmu/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_image_to_text/mmmu/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_image_to_text/mmmu/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_image_to_text/mmmu/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AGIEval/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AGIEval/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AGIEval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AGIEval/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AGIEval/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AGIEval/tools.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/ARC/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/ARC/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/ARC/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/ARC/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AdvBench/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AdvBench/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AdvBench/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AdvBench/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/AdvBench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/AdvBench/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Anthropics/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Anthropics/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Anthropics/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Anthropics/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Anthropics/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Anthropics/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BBQ/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BBQ/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BBQ/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BBQ/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BBQ/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BBQ/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BeaverTails/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BeaverTails/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BeaverTails/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BeaverTails/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/BeaverTails/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/BeaverTails/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CDialBias/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CDialBias/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CDialBias/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CDialBias/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CDialBias/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CDialBias/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CEval/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CEval/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CEval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CEval/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CMMLU/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CMMLU/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CMMLU/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CMMLU/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Cona/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Cona/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Cona/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Cona/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Cona/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Cona/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Confaide/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Confaide/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Confaide/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Confaide/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CyberAttackAssistance/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CyberAttackAssistance/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CyberAttackAssistance/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CyberAttackAssistance/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/CyberAttackAssistance/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/CyberAttackAssistance/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DeceptionBench/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DeceptionBench/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DeceptionBench/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DeceptionBench/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DeceptionBench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DeceptionBench/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DecodingTrust/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DecodingTrust/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DecodingTrust/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DecodingTrust/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Dice/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Dice/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoAnythingNow/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoAnythingNow/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoAnythingNow/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoAnythingNow/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoAnythingNow/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoAnythingNow/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoNotAnswer/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoNotAnswer/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoNotAnswer/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoNotAnswer/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/DoNotAnswer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/DoNotAnswer/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/FakeAlignment/LLM_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/FakeAlignment/LLM_utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/FakeAlignment/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/FakeAlignment/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/FakeAlignment/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/FakeAlignment/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/FakeAlignment/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/FakeAlignment/prompts.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/FakeAlignment/safety.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/FakeAlignment/safety.jsonl -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/Flames_1k_Chinese.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/Flames_1k_Chinese.jsonl -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/configuration_internlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/configuration_internlm.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/infer.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/modeling_internlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/modeling_internlm.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/tokenization_internlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/tokenization_internlm.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Flames/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Flames/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HExPHI/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HExPHI/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HExPHI/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HExPHI/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HExPHI/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HExPHI/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmBench/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmBench/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmBench/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmBench/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmBench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmBench/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmfulQ/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmfulQ/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmfulQ/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmfulQ/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HarmfulQ/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HarmfulQ/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HumanEval/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HumanEval/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HumanEval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HumanEval/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/HumanEval/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/HumanEval/metrics.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/LatentJailbreak/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/LatentJailbreak/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/LatentJailbreak/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/LatentJailbreak/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/LatentJailbreak/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/LatentJailbreak/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MIC/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MIC/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MIC/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MIC/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MIC/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MIC/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MMLUPRO/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MMLUPRO/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MMLUPRO/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MMLUPRO/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstruct/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstruct/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstruct/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstruct/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstruct/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstruct/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstructions/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstructions/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstructions/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstructions/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MaliciousInstructions/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MaliciousInstructions/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/README.md -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/answers/6_concepts.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/answers/6_concepts.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/answers/6_concepts_compare.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/answers/6_concepts_compare.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/answers/MFQ_30.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/answers/MFQ_30.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/answers/MFQ_30_compare.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/answers/MFQ_30_compare.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/main.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/authority_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/fairness_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/harm_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/ingroup_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/liberty_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts/purity_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/authority_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/fairness_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/harm_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/ingroup_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/liberty_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/6_concepts_compare/purity_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/authority_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/fairness_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/harm_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/ingroup_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30/purity_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/authority_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/fairness_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/harm_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/ingroup_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_1.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_2.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_3.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/questions/MFQ_30_compare/purity_4.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/template/moral_system.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/template/moral_system.txt -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralBench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralBench/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralChoice/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralChoice/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralChoice/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralChoice/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/MoralChoice/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/MoralChoice/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/RedEval/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/RedEval/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/RedEval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/RedEval/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/RedEval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/RedEval/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SandP/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SandP/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SandP/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SandP/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SandP/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SandP/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/SimpleSafetyTests/Strongreject/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Strongreject/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Strongreject/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Strongreject/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Strongreject/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/Strongreject/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/Strongreject/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TDCRedTeaming/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TDCRedTeaming/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TDCRedTeaming/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TDCRedTeaming/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TDCRedTeaming/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TDCRedTeaming/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TruthfulQA/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TruthfulQA/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TruthfulQA/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TruthfulQA/dataloader.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TruthfulQA/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TruthfulQA/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TruthfulQA/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TruthfulQA/metrics.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/TruthfulQA/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/TruthfulQA/tools.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSTest/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSTest/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSTest/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSTest/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSTest/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSTest/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/LICENSE -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/README.md -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ar/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Crimes_And_Illegal_Activities_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Crimes_And_Illegal_Activities_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Ethics_And_Morality_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Ethics_And_Morality_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Goal_Hijacking_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Goal_Hijacking_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Inquiry_With_Unsafe_Opinion_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Inquiry_With_Unsafe_Opinion_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Insult_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Insult_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Mental_Health_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Mental_Health_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Physical_Harm_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Physical_Harm_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Privacy_And_Property_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Privacy_And_Property_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Prompt_Leaking_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Prompt_Leaking_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Reverse_Exposure_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Reverse_Exposure_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Role_Play_Instruction_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Role_Play_Instruction_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Unfairness_And_Discrimination_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Unfairness_And_Discrimination_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Unsafe_Instruction_Topic_n.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/Unsafe_Instruction_Topic_n.xlsx -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/bn/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/de/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Crimes_And_Illegal_Activities_en.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Crimes_And_Illegal_Activities_en.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Ethics_And_Morality_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Ethics_And_Morality_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Goal_Hijacking_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Goal_Hijacking_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Inquiry_With_Unsafe_Opinion_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Inquiry_With_Unsafe_Opinion_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Insult_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Insult_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Mental_Health_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Mental_Health_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Physical_Harm_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Physical_Harm_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Privacy_And_Property_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Privacy_And_Property_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Prompt_Leaking_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Prompt_Leaking_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Reverse_Exposure_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Reverse_Exposure_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Role_Play_Instruction_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Role_Play_Instruction_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Unfairness_And_Discrimination_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Unfairness_And_Discrimination_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Unsafe_Instruction_Topic_n.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/Unsafe_Instruction_Topic_n.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/en/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/fr/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/commen_sense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/commen_sense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/hi/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ja/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/Overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/Overview.png -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/framework.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/framework.jpg -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/frameworks.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/frameworks.pdf -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/result1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/result1.jpg -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/result2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/paper/result2.jpg -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Crimes_And_Illegal_Activitie.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Crimes_And_Illegal_Activitie.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/ru/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/sp/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Crimes_And_Illegal_Activities.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Crimes_And_Illegal_Activities.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Ethics_And_Morality.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Ethics_And_Morality.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Goal_Hijacking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Goal_Hijacking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Inquiry_With_Unsafe_Opinion.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Inquiry_With_Unsafe_Opinion.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Insult.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Insult.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Mental_Health.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Mental_Health.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Physical_Harm.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Physical_Harm.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Privacy_And_Property.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Privacy_And_Property.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Prompt_Leaking.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Prompt_Leaking.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Reverse_Exposure.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Reverse_Exposure.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Role_Play_Instruction.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Role_Play_Instruction.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Unfairness_And_Discrimination.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Unfairness_And_Discrimination.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Unsafe_Instruction_Topic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/Unsafe_Instruction_Topic.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/commonsense.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/Multilingual_safety_benchmark/zh/commonsense.csv -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/XSafety/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/XSafety/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/aegis_aicontent_safety_dataset/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/air_bench_2024/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/air_bench_2024/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/air_bench_2024/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/air_bench_2024/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/air_bench_2024/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/air_bench_2024/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gptfuzzer/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gptfuzzer/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gptfuzzer/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gptfuzzer/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gptfuzzer/prompts.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gptfuzzer/prompts.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gptfuzzer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gptfuzzer/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gsm8k/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gsm8k/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/gsm8k/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/gsm8k/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jade_db/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jade_db/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jade_db/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jade_db/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jade_db/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jade_db/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jbb_behaviors/classifier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jbb_behaviors/classifier.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jbb_behaviors/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jbb_behaviors/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jbb_behaviors/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jbb_behaviors/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/jbb_behaviors/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/jbb_behaviors/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/llm_jailbreak_study/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/llm_jailbreak_study/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/llm_jailbreak_study/data.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/llm_jailbreak_study/data.json -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/llm_jailbreak_study/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/llm_jailbreak_study/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/llm_jailbreak_study/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/llm_jailbreak_study/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/mmlu/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/mmlu/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/mmlu/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/mmlu/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/s_eval/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/s_eval/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/s_eval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/s_eval/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/s_eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/s_eval/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/evaluator.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/metrics.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/model_utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/template.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/text_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/text_utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_to_text/salad_bench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_to_text/salad_bench/utils.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_video_to_text/mmvu/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_video_to_text/mmvu/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_video_to_text/mmvu/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_video_to_text/mmvu/eval.py -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_vision_to_action/chores/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_vision_to_action/chores/configs.yaml -------------------------------------------------------------------------------- /eval_anything/benchmarks/text_vision_to_action/chores/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/benchmarks/text_vision_to_action/chores/eval.py -------------------------------------------------------------------------------- /eval_anything/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/cli.py -------------------------------------------------------------------------------- /eval_anything/configs/evaluate.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_Confaide.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_Confaide.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_DecodingTrust.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_DecodingTrust.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_DoNotAnswer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_DoNotAnswer.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_FakeAlignment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_FakeAlignment.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_Flames.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_Flames.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_HExPHI.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_HExPHI.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_HarmBench.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_HarmBench.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_HarmfulQ.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_HarmfulQ.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_LatentJailbreak.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_LatentJailbreak.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_MaliciousInstruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_MaliciousInstruct.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_MaliciousInstructions.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_MaliciousInstructions.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_MoralBench.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_MoralBench.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_RedEval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_RedEval.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_XSafety.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_XSafety.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_aegis_aicontent_safety_dataset.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_aegis_aicontent_safety_dataset.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_air_bench_2024.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_air_bench_2024.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_deceptionbench.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_deceptionbench.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_gptfuzzer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_gptfuzzer.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_jade_db.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_jade_db.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_jbb_behaviors.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_jbb_behaviors.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_llm_jailbreak_study.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_llm_jailbreak_study.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_s_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_s_eval.yaml -------------------------------------------------------------------------------- /eval_anything/configs/evaluate_salad_bench.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/configs/evaluate_salad_bench.yaml -------------------------------------------------------------------------------- /eval_anything/dataloader/base_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/dataloader/base_dataloader.py -------------------------------------------------------------------------------- /eval_anything/dataloader/format_mm_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/dataloader/format_mm_dataset.py -------------------------------------------------------------------------------- /eval_anything/dataloader/mm_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/dataloader/mm_dataloader.py -------------------------------------------------------------------------------- /eval_anything/dataloader/t2t_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/dataloader/t2t_dataloader.py -------------------------------------------------------------------------------- /eval_anything/dataloader/tv2act_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/dataloader/tv2act_dataloader.py -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/data/HarmfulQ.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/data/HarmfulQ.json -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/data/MaliciousInstruct.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/data/MaliciousInstruct.txt -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/data/MaliciousInstructions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/data/MaliciousInstructions.json -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/data/harmbench_behaviors_text_all.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/data/harmbench_behaviors_text_all.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/data/latent_jailbreak_data.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/data/latent_jailbreak_data.json -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/LICENSE -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/README.md -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v1.0/jade_benchmark_en.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v1.0/jade_benchmark_en.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v1.0/jade_benchmark_zh.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v1.0/jade_benchmark_zh.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v2.0/jade_benchmark_easy_zh.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v2.0/jade_benchmark_easy_zh.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v2.0/jade_benchmark_medium_zh.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v2.0/jade_benchmark_medium_zh.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/README.md -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/jade_alignment_hard_zh.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/jade_alignment_hard_zh.csv -------------------------------------------------------------------------------- /eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/jade_alignment_medium_zh.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/eval-anything-local/jade_db_data/jade-db-v3.0/jade_alignment_medium_zh.csv -------------------------------------------------------------------------------- /eval_anything/evaluate_tools/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/evaluate_tools/README.md -------------------------------------------------------------------------------- /eval_anything/evaluate_tools/base_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/evaluate_tools/base_tools.py -------------------------------------------------------------------------------- /eval_anything/evaluate_tools/cached_requests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/evaluate_tools/cached_requests.py -------------------------------------------------------------------------------- /eval_anything/evaluate_tools/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/evaluate_tools/metrics.py -------------------------------------------------------------------------------- /eval_anything/evaluate_tools/t2t_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/evaluate_tools/t2t_tools.py -------------------------------------------------------------------------------- /eval_anything/license/add_license.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/license/add_license.py -------------------------------------------------------------------------------- /eval_anything/license/add_third_party.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/license/add_third_party.py -------------------------------------------------------------------------------- /eval_anything/models/api_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/api_lm.py -------------------------------------------------------------------------------- /eval_anything/models/base_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/base_model.py -------------------------------------------------------------------------------- /eval_anything/models/hf_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/hf_lm.py -------------------------------------------------------------------------------- /eval_anything/models/hf_mm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/hf_mm.py -------------------------------------------------------------------------------- /eval_anything/models/hf_vla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/hf_vla.py -------------------------------------------------------------------------------- /eval_anything/models/vllm_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/vllm_lm.py -------------------------------------------------------------------------------- /eval_anything/models/vllm_mm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/models/vllm_mm.py -------------------------------------------------------------------------------- /eval_anything/pipeline/base_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/base_benchmark.py -------------------------------------------------------------------------------- /eval_anything/pipeline/base_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/base_task.py -------------------------------------------------------------------------------- /eval_anything/pipeline/mm_gen_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/mm_gen_benchmark.py -------------------------------------------------------------------------------- /eval_anything/pipeline/mm_und_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/mm_und_benchmark.py -------------------------------------------------------------------------------- /eval_anything/pipeline/t2t_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/t2t_benchmark.py -------------------------------------------------------------------------------- /eval_anything/pipeline/tv2act_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/pipeline/tv2act_benchmark.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/manipulation_sensors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/manipulation_sensors.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/navigation_sensors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/navigation_sensors.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/spoc_objects.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/spoc_objects.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/stretch_controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/stretch_controller.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/stretch_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/stretch_state.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/environment/vision_sensors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/environment/vision_sensors.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/spoc_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/spoc_model/__init__.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/spoc_model/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/spoc_model/agent.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/spoc_model/early_fusion_tsfm_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/spoc_model/early_fusion_tsfm_models.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/spoc_model/preprocessors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/spoc_model/preprocessors.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/spoc_model/text_cond_visual_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/spoc_model/text_cond_visual_encoder.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/__init__.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/abstract_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/abstract_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/abstract_task_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/abstract_task_sampler.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/fetch_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/fetch_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/multi_task_eval_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/multi_task_eval_sampler.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/object_nav_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/object_nav_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/pickup_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/pickup_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/room_nav_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/room_nav_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/room_visit_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/room_visit_task.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/safety_components.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/safety_components.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/tasks/task_specs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/tasks/task_specs.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/constants/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/constants/objaverse_data_dirs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/constants/objaverse_data_dirs.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/constants/object_constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/constants/object_constants.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/constants/stretch_initialization_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/constants/stretch_initialization_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/constants/template_verbs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/constants/template_verbs.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/data_generation_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/data_generation_utils/mp4_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/data_generation_utils/mp4_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/data_generation_utils/navigation_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/data_generation_utils/navigation_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/distance_calculation_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/distance_calculation_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/objaverse_annotation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/objaverse_annotation.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/online_evaluation_types_and_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/online_evaluation_types_and_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/reward_shaper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/reward_shaper.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/sel_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/sel_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/sensor_constant_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/sensor_constant_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/string_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/string_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/synset_to_best_lemma.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/synset_to_best_lemma.json -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/synset_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/synset_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/task_datagen_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/task_datagen_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/task_spec_to_instruction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/task_spec_to_instruction.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/task_type_mapping_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/task_type_mapping_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/transformation_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/transformation_util.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/type_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/type_utils.py -------------------------------------------------------------------------------- /eval_anything/third_party/SPOC/utils/visualization_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/third_party/SPOC/utils/visualization_utils.py -------------------------------------------------------------------------------- /eval_anything/utils/cache_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/cache_manager.py -------------------------------------------------------------------------------- /eval_anything/utils/cached_requests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/cached_requests.py -------------------------------------------------------------------------------- /eval_anything/utils/data_type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/data_type.py -------------------------------------------------------------------------------- /eval_anything/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/logger.py -------------------------------------------------------------------------------- /eval_anything/utils/mm_data_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/mm_data_manager.py -------------------------------------------------------------------------------- /eval_anything/utils/prompt_builders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/prompt_builders.py -------------------------------------------------------------------------------- /eval_anything/utils/register.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/register.py -------------------------------------------------------------------------------- /eval_anything/utils/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/template.py -------------------------------------------------------------------------------- /eval_anything/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/utils.py -------------------------------------------------------------------------------- /eval_anything/utils/uuid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/utils/uuid.py -------------------------------------------------------------------------------- /eval_anything/version.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/eval_anything/version.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/pyproject.toml -------------------------------------------------------------------------------- /scripts/download_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/download_dataset.py -------------------------------------------------------------------------------- /scripts/download_objaverse_houses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/download_objaverse_houses.py -------------------------------------------------------------------------------- /scripts/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run.sh -------------------------------------------------------------------------------- /scripts/run_Confaide.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_Confaide.sh -------------------------------------------------------------------------------- /scripts/run_DecodingTrust.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_DecodingTrust.sh -------------------------------------------------------------------------------- /scripts/run_DoNotAnswer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_DoNotAnswer.sh -------------------------------------------------------------------------------- /scripts/run_Flames.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_Flames.sh -------------------------------------------------------------------------------- /scripts/run_HExPHI.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_HExPHI.sh -------------------------------------------------------------------------------- /scripts/run_HarmBench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_HarmBench.sh -------------------------------------------------------------------------------- /scripts/run_LatentJailbreak.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_LatentJailbreak.sh -------------------------------------------------------------------------------- /scripts/run_MoralBench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_MoralBench.sh -------------------------------------------------------------------------------- /scripts/run_RedEval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_RedEval.sh -------------------------------------------------------------------------------- /scripts/run_XSafety.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_XSafety.sh -------------------------------------------------------------------------------- /scripts/run_deceptionbench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_deceptionbench.sh -------------------------------------------------------------------------------- /scripts/run_jade_db.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_jade_db.sh -------------------------------------------------------------------------------- /scripts/run_vla.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/scripts/run_vla.sh -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PKU-Alignment/eval-anything/HEAD/setup.py --------------------------------------------------------------------------------