├── .gitignore ├── LICENSE.md ├── README.md ├── assets ├── pmpd_illustration_hf.png └── pmpd_npu_perf_comparison.png ├── pmpd ├── __init__.py ├── application │ └── demo.py ├── eval │ ├── anyprec │ │ ├── mobilellama │ │ │ ├── eval_cnn_dm.sh │ │ │ ├── eval_dsum.sh │ │ │ ├── eval_gsm8k.sh │ │ │ ├── eval_mt_bench.sh │ │ │ ├── eval_passkey.sh │ │ │ ├── eval_strategyqa.sh │ │ │ └── eval_translation.sh │ │ ├── phi │ │ │ ├── eval_cnn_dm.sh │ │ │ ├── eval_dsum.sh │ │ │ ├── eval_gsm8k.sh │ │ │ ├── eval_mt_bench.sh │ │ │ ├── eval_passkey.sh │ │ │ └── eval_translation.sh │ │ ├── qwen │ │ │ └── eval_mt_bench.sh │ │ ├── vicuna │ │ │ ├── eval_cnn_dm.sh │ │ │ ├── eval_dsum.sh │ │ │ ├── eval_mt_bench.sh │ │ │ └── eval_translation.sh │ │ └── zephyr │ │ │ ├── eval_cnn_dm.sh │ │ │ ├── eval_dsum.sh │ │ │ ├── eval_mt_bench.sh │ │ │ └── eval_translation.sh │ ├── eval.py │ ├── evaluate_generation.py │ └── get_score.py ├── modules │ ├── __init__.py │ ├── model.py │ ├── scheduler │ │ ├── __init__.py │ │ ├── act_scheduler.py │ │ ├── confidence_scheduler.py │ │ ├── kv_cache_scheduler.py │ │ ├── naive_scheduler.py │ │ ├── random_scheduler.py │ │ └── scheduler.py │ └── zoo.py └── train │ ├── generate_train_dataset.py │ ├── hypertune.py │ ├── train.sh │ └── train_scheduler.py ├── requirements.txt └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/LICENSE.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/README.md -------------------------------------------------------------------------------- /assets/pmpd_illustration_hf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/assets/pmpd_illustration_hf.png -------------------------------------------------------------------------------- /assets/pmpd_npu_perf_comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/assets/pmpd_npu_perf_comparison.png -------------------------------------------------------------------------------- /pmpd/__init__.py: -------------------------------------------------------------------------------- 1 | from .modules import * -------------------------------------------------------------------------------- /pmpd/application/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/application/demo.py -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_cnn_dm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_cnn_dm.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_dsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_dsum.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_gsm8k.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_gsm8k.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_mt_bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_mt_bench.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_passkey.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_passkey.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_strategyqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_strategyqa.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/mobilellama/eval_translation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/mobilellama/eval_translation.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_cnn_dm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_cnn_dm.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_dsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_dsum.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_gsm8k.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_gsm8k.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_mt_bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_mt_bench.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_passkey.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_passkey.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/phi/eval_translation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/phi/eval_translation.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/qwen/eval_mt_bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/qwen/eval_mt_bench.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/vicuna/eval_cnn_dm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/vicuna/eval_cnn_dm.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/vicuna/eval_dsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/vicuna/eval_dsum.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/vicuna/eval_mt_bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/vicuna/eval_mt_bench.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/vicuna/eval_translation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/vicuna/eval_translation.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/zephyr/eval_cnn_dm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/zephyr/eval_cnn_dm.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/zephyr/eval_dsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/zephyr/eval_dsum.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/zephyr/eval_mt_bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/zephyr/eval_mt_bench.sh -------------------------------------------------------------------------------- /pmpd/eval/anyprec/zephyr/eval_translation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/anyprec/zephyr/eval_translation.sh -------------------------------------------------------------------------------- /pmpd/eval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/eval.py -------------------------------------------------------------------------------- /pmpd/eval/evaluate_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/evaluate_generation.py -------------------------------------------------------------------------------- /pmpd/eval/get_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/eval/get_score.py -------------------------------------------------------------------------------- /pmpd/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/__init__.py -------------------------------------------------------------------------------- /pmpd/modules/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/model.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/__init__.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/act_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/act_scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/confidence_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/confidence_scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/kv_cache_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/kv_cache_scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/naive_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/naive_scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/random_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/random_scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/scheduler/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/scheduler/scheduler.py -------------------------------------------------------------------------------- /pmpd/modules/zoo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/modules/zoo.py -------------------------------------------------------------------------------- /pmpd/train/generate_train_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/train/generate_train_dataset.py -------------------------------------------------------------------------------- /pmpd/train/hypertune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/train/hypertune.py -------------------------------------------------------------------------------- /pmpd/train/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/train/train.sh -------------------------------------------------------------------------------- /pmpd/train/train_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/pmpd/train/train_scheduler.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/requirements.txt -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SamsungLabs/PMPD/HEAD/setup.py --------------------------------------------------------------------------------