├── README.md └── code ├── evaluation ├── eval_baseline_scripts │ ├── evaluation1.py │ ├── evaluation2.py │ ├── evaluation3.py │ ├── evaluation4.py │ ├── evaluation5.py │ ├── evaluation6.py │ ├── evaluation7.py │ ├── evaluation8.py │ └── evaluation9.py ├── eval_jailbreak_scripts │ ├── evaluation.py │ ├── evaluation1.py │ ├── evaluation2.py │ ├── evaluation3.py │ ├── evaluation4.py │ ├── evaluation5.py │ ├── evaluation6.py │ ├── evaluation7.py │ ├── evaluation8.py │ └── evaluation9.py ├── statistic.py └── statistic_results │ ├── baseline │ ├── Llama3_llava_next_8b_hf │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Llama_3_2_11B_Vision_Instruct │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── MM_Eureka_Qwen_7B │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Mulberry_llama_11b │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Mulberry_llava_8b │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Mulberry_qwen2vl_7b │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Qwen2_5_VL_7B_Instruct │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── Qwen2_VL_7B_Instruct │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ ├── R1_Onevision_7B │ │ ├── 01-Illegal_Activitiy.json │ │ ├── 02-HateSpeech.json │ │ ├── 03-Malware_Generation.json │ │ ├── 04-Physical_Harm.json │ │ ├── 06-Fraud.json │ │ ├── 07-Sex.json │ │ ├── 09-Privacy_Violence.json │ │ ├── 10-Legal_Opinion.json │ │ ├── 11-Financial_Advice.json │ │ └── 12-Health_Consultation.json │ └── memo.py │ └── jailbreak_method │ ├── Llama3_llava_next_8b_hf │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Llama_3_2_11B_Vision_Instruct │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── MM_Eureka_Qwen_7B │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Mulberry_llama_11b │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Mulberry_llava_8b │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Mulberry_qwen2vl_7b │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Qwen2_5_VL_7B_Instruct │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── Qwen2_VL_7B_Instruct │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ ├── R1_Onevision_7B │ ├── 01-Illegal_Activitiy.json │ ├── 02-HateSpeech.json │ ├── 03-Malware_Generation.json │ ├── 04-Physical_Harm.json │ ├── 06-Fraud.json │ ├── 07-Sex.json │ ├── 09-Privacy_Violence.json │ ├── 10-Legal_Opinion.json │ ├── 11-Financial_Advice.json │ └── 12-Health_Consultation.json │ └── memo.txt └── exp_on_MM-SafeBench ├── demo.jpeg ├── exp1.py ├── exp2.py ├── exp3.py ├── exp4.py ├── exp5.py └── exp6.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/README.md -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation1.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation2.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation3.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation4.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation5.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation6.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation7.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation8.py -------------------------------------------------------------------------------- /code/evaluation/eval_baseline_scripts/evaluation9.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_baseline_scripts/evaluation9.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation1.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation2.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation3.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation4.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation5.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation6.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation7.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation8.py -------------------------------------------------------------------------------- /code/evaluation/eval_jailbreak_scripts/evaluation9.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/eval_jailbreak_scripts/evaluation9.py -------------------------------------------------------------------------------- /code/evaluation/statistic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic.py -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama3_llava_next_8b_hf/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Llama_3_2_11B_Vision_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/MM_Eureka_Qwen_7B/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llama_11b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llama_11b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_llava_8b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_llava_8b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Mulberry_qwen2vl_7b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_5_VL_7B_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/Qwen2_VL_7B_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/R1_Onevision_7B/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/R1_Onevision_7B/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/baseline/memo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/baseline/memo.py -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama3_llava_next_8b_hf/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Llama_3_2_11B_Vision_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/MM_Eureka_Qwen_7B/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llama_11b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_llava_8b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Mulberry_qwen2vl_7b/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_5_VL_7B_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/Qwen2_VL_7B_Instruct/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/01-Illegal_Activitiy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/01-Illegal_Activitiy.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/02-HateSpeech.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/02-HateSpeech.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/03-Malware_Generation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/03-Malware_Generation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/04-Physical_Harm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/04-Physical_Harm.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/06-Fraud.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/06-Fraud.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/07-Sex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/07-Sex.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/09-Privacy_Violence.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/09-Privacy_Violence.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/10-Legal_Opinion.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/10-Legal_Opinion.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/11-Financial_Advice.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/11-Financial_Advice.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/12-Health_Consultation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/R1_Onevision_7B/12-Health_Consultation.json -------------------------------------------------------------------------------- /code/evaluation/statistic_results/jailbreak_method/memo.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/evaluation/statistic_results/jailbreak_method/memo.txt -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/demo.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/demo.jpeg -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp1.py -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp2.py -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp3.py -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp4.py -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp5.py -------------------------------------------------------------------------------- /code/exp_on_MM-SafeBench/exp6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/fangjf1/OpenSafeMLRM/HEAD/code/exp_on_MM-SafeBench/exp6.py --------------------------------------------------------------------------------