├── .gitignore
├── README.md
├── baselines
    ├── Copilot
    │   ├── README.md
    │   ├── api.py
    │   ├── output
    │   │   ├── APPS
    │   │   │   ├── completion_0.pkl
    │   │   │   ├── completion_1.pkl
    │   │   │   ├── completion_2.pkl
    │   │   │   ├── completion_3.pkl
    │   │   │   ├── completion_4.pkl
    │   │   │   ├── prediction_from_file_rank0_multi0.log
    │   │   │   ├── prediction_from_file_rank0_single3.log
    │   │   │   └── prediction_from_file_rank0_single5.log
    │   │   ├── HumanEval
    │   │   │   ├── completion_0.pkl
    │   │   │   ├── completion_1.pkl
    │   │   │   ├── completion_2.pkl
    │   │   │   ├── completion_3.pkl
    │   │   │   ├── completion_4.pkl
    │   │   │   ├── prediction_from_file_rank0_multi0.log
    │   │   │   ├── prediction_from_file_rank0_single3.log
    │   │   │   └── prediction_from_file_rank0_single5.log
    │   │   └── MBPP
    │   │   │   ├── completion_0.pkl
    │   │   │   ├── completion_1.pkl
    │   │   │   ├── completion_2.pkl
    │   │   │   ├── completion_3.pkl
    │   │   │   ├── completion_4.pkl
    │   │   │   ├── prediction_from_file_rank0_multi0.log
    │   │   │   ├── prediction_from_file_rank0_single3.log
    │   │   │   └── prediction_from_file_rank0_single5.log
    │   ├── query_apps.py
    │   ├── query_humaneval.py
    │   └── query_mbpp.py
    ├── Finetune CodeT5
    │   ├── README.md
    │   └── output
    │   │   ├── APPS
    │   │       ├── prediction-5_beam.pkl
    │   │       └── prediction_from_file.log
    │   │   ├── HumanEval
    │   │       ├── prediction-5_beam300_full.pkl
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       └── prediction_from_file_rank0_single5.log
    │   │   └── MBPP
    │   │       ├── prediction-5_beam300_full.pkl
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       └── prediction_from_file_rank0_single5.log
    ├── GPT-3.5
    │   ├── OpenAI.py
    │   └── output
    │   │   ├── APPS
    │   │       ├── openai_gpt35_apps_testcase_n5_seed42_0613_executable.json
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       ├── prediction_from_file_rank0_single5.log
    │   │       ├── prediction_from_file_rank1_multi0.log
    │   │       ├── prediction_from_file_rank1_single3.log
    │   │       ├── prediction_from_file_rank1_single5.log
    │   │       ├── prediction_from_file_rank2_multi0.log
    │   │       ├── prediction_from_file_rank2_single3.log
    │   │       ├── prediction_from_file_rank2_single5.log
    │   │       ├── prediction_from_file_rank3_multi0.log
    │   │       ├── prediction_from_file_rank3_single3.log
    │   │       ├── prediction_from_file_rank3_single5.log
    │   │       ├── prediction_from_file_rank4_multi0.log
    │   │       ├── prediction_from_file_rank4_single3.log
    │   │       └── prediction_from_file_rank4_single5.log
    │   │   ├── HumanEval
    │   │       ├── openai_gpt35_humaneval_testcase_n5_seed42_1106_full.json
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       ├── prediction_from_file_rank0_single5.log
    │   │       ├── prediction_from_file_rank1_multi0.log
    │   │       ├── prediction_from_file_rank1_single3.log
    │   │       ├── prediction_from_file_rank1_single5.log
    │   │       ├── prediction_from_file_rank2_multi0.log
    │   │       ├── prediction_from_file_rank2_single3.log
    │   │       ├── prediction_from_file_rank2_single5.log
    │   │       ├── prediction_from_file_rank3_multi0.log
    │   │       ├── prediction_from_file_rank3_single3.log
    │   │       ├── prediction_from_file_rank3_single5.log
    │   │       ├── prediction_from_file_rank4_multi0.log
    │   │       ├── prediction_from_file_rank4_single3.log
    │   │       └── prediction_from_file_rank4_single5.log
    │   │   └── MBPP
    │   │       ├── openai_gpt35_mbpp_testcase_n5_seed42_1106_full.json
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       ├── prediction_from_file_rank0_single5.log
    │   │       ├── prediction_from_file_rank1_multi0.log
    │   │       ├── prediction_from_file_rank1_single3.log
    │   │       ├── prediction_from_file_rank1_single5.log
    │   │       ├── prediction_from_file_rank2_multi0.log
    │   │       ├── prediction_from_file_rank2_single3.log
    │   │       ├── prediction_from_file_rank2_single5.log
    │   │       ├── prediction_from_file_rank3_multi0.log
    │   │       ├── prediction_from_file_rank3_single3.log
    │   │       ├── prediction_from_file_rank3_single5.log
    │   │       ├── prediction_from_file_rank4_multi0.log
    │   │       ├── prediction_from_file_rank4_single3.log
    │   │       └── prediction_from_file_rank4_single5.log
    ├── InCoder
    │   ├── InCoder-6B.py
    │   └── output
    │   │   ├── APPS
    │   │       ├── incoder-6B_apps_testcase_beam_executable.json
    │   │       └── prediction_from_file.log
    │   │   ├── HumanEval
    │   │       ├── incoder-6B_humaneval_testcase_beam_full.json
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       └── prediction_from_file_rank0_single5.log
    │   │   └── MBPP
    │   │       ├── incoder-6B_mbpp_testcase_beam_full.json
    │   │       ├── prediction_from_file_rank0_multi0.log
    │   │       ├── prediction_from_file_rank0_single3.log
    │   │       └── prediction_from_file_rank0_single5.log
    ├── Pynguin
    │   ├── 1_arrange_datasets.ipynb
    │   ├── 2_pynguin_apps.sh
    │   ├── 2_pynguin_humaneval.sh
    │   ├── 2_pynguin_mbpp.sh
    │   ├── README.md
    │   ├── coverage_note.txt
    │   ├── evaluate_results_pynguin.ipynb
    │   └── output
    │   │   ├── HumanEval
    │   │       ├── coverage_humaneval_3.json
    │   │       ├── coverage_humaneval_5.json
    │   │       ├── coverage_humaneval_perfect.json
    │   │       ├── mutation_humaneval.sh
    │   │       ├── mutation_humaneval_3.txt
    │   │       ├── mutation_humaneval_5.txt
    │   │       └── mutation_humaneval_perfect.txt
    │   │   └── MBPP
    │   │       ├── coverage_mbpp_3.json
    │   │       ├── coverage_mbpp_5.json
    │   │       ├── coverage_mbpp_perfect.json
    │   │       ├── mutation_mbpp.sh
    │   │       ├── mutation_mbpp_3.txt
    │   │       ├── mutation_mbpp_5.txt
    │   │       └── mutation_mbpp_perfect.txt
    └── StarCoder
    │   ├── StarCoder.py
    │   └── output
    │       ├── APPS
    │           ├── prediction_from_file.log
    │           └── starcoder_apps_testcase_beam_executable.json
    │       ├── HumanEval
    │           ├── prediction_from_file_rank0_multi0.log
    │           ├── prediction_from_file_rank0_single3.log
    │           ├── prediction_from_file_rank0_single5.log
    │           └── starcoder_humaneval_testcase_beam_full.json
    │       └── MBPP
    │           ├── prediction_from_file_rank0_multi0.log
    │           ├── prediction_from_file_rank0_single3.log
    │           ├── prediction_from_file_rank0_single5.log
    │           └── starcoder_mbpp_testcase_beam_full.json
├── datasets
    ├── HumanEval
    │   └── humaneval_test.csv
    └── MBPP
    │   └── mbpp_test.csv
├── evaluation.py
├── finetuning.py
├── handlers
    ├── __init__.py
    ├── code_processing.py
    ├── literals.json
    ├── python_terminal_command.py
    ├── testing_util.py
    ├── testing_util_v2.py
    └── utils.py
├── inference.py
├── ppo_training.py
├── requirements.txt
└── results
    ├── APPS
        ├── prediction-5_beam300.pkl
        ├── prediction.log
        └── prediction_from_file.log
    ├── HumanEval
        ├── prediction-5_beam300_full.pkl
        ├── prediction_from_file_rank0_multi0.log
        ├── prediction_from_file_rank0_single3.log
        └── prediction_from_file_rank0_single5.log
    └── MBPP
        ├── prediction-5_beam300_full.pkl
        ├── prediction_from_file_rank0_multi0.log
        ├── prediction_from_file_rank0_single3.log
        └── prediction_from_file_rank0_single5.log


/.gitignore:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/.gitignore


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/README.md


--------------------------------------------------------------------------------
/baselines/Copilot/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/README.md


--------------------------------------------------------------------------------
/baselines/Copilot/api.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/api.py


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/completion_0.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/completion_0.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/completion_1.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/completion_1.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/completion_2.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/completion_2.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/completion_3.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/completion_3.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/completion_4.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/completion_4.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/APPS/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/APPS/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/completion_0.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/completion_0.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/completion_1.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/completion_1.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/completion_2.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/completion_2.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/completion_3.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/completion_3.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/completion_4.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/completion_4.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/completion_0.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/completion_0.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/completion_1.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/completion_1.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/completion_2.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/completion_2.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/completion_3.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/completion_3.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/completion_4.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/completion_4.pkl


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/Copilot/output/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/output/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/Copilot/query_apps.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/query_apps.py


--------------------------------------------------------------------------------
/baselines/Copilot/query_humaneval.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/query_humaneval.py


--------------------------------------------------------------------------------
/baselines/Copilot/query_mbpp.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Copilot/query_mbpp.py


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/README.md


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/APPS/prediction-5_beam.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/APPS/prediction-5_beam.pkl


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/APPS/prediction_from_file.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/APPS/prediction_from_file.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/HumanEval/prediction-5_beam300_full.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/HumanEval/prediction-5_beam300_full.pkl


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/MBPP/prediction-5_beam300_full.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/MBPP/prediction-5_beam300_full.pkl


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Finetune CodeT5/output/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/OpenAI.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/OpenAI.py


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/openai_gpt35_apps_testcase_n5_seed42_0613_executable.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/openai_gpt35_apps_testcase_n5_seed42_0613_executable.json


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank1_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank2_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank3_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/APPS/prediction_from_file_rank4_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/openai_gpt35_humaneval_testcase_n5_seed42_1106_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/openai_gpt35_humaneval_testcase_n5_seed42_1106_full.json


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank1_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank2_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank3_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/HumanEval/prediction_from_file_rank4_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/openai_gpt35_mbpp_testcase_n5_seed42_1106_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/openai_gpt35_mbpp_testcase_n5_seed42_1106_full.json


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank1_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank2_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank3_single5.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_multi0.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_single3.log


--------------------------------------------------------------------------------
/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/GPT-3.5/output/MBPP/prediction_from_file_rank4_single5.log


--------------------------------------------------------------------------------
/baselines/InCoder/InCoder-6B.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/InCoder-6B.py


--------------------------------------------------------------------------------
/baselines/InCoder/output/APPS/incoder-6B_apps_testcase_beam_executable.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/APPS/incoder-6B_apps_testcase_beam_executable.json


--------------------------------------------------------------------------------
/baselines/InCoder/output/APPS/prediction_from_file.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/APPS/prediction_from_file.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/HumanEval/incoder-6B_humaneval_testcase_beam_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/HumanEval/incoder-6B_humaneval_testcase_beam_full.json


--------------------------------------------------------------------------------
/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/MBPP/incoder-6B_mbpp_testcase_beam_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/MBPP/incoder-6B_mbpp_testcase_beam_full.json


--------------------------------------------------------------------------------
/baselines/InCoder/output/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/InCoder/output/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/InCoder/output/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/Pynguin/1_arrange_datasets.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/1_arrange_datasets.ipynb


--------------------------------------------------------------------------------
/baselines/Pynguin/2_pynguin_apps.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/2_pynguin_apps.sh


--------------------------------------------------------------------------------
/baselines/Pynguin/2_pynguin_humaneval.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/2_pynguin_humaneval.sh


--------------------------------------------------------------------------------
/baselines/Pynguin/2_pynguin_mbpp.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/2_pynguin_mbpp.sh


--------------------------------------------------------------------------------
/baselines/Pynguin/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/README.md


--------------------------------------------------------------------------------
/baselines/Pynguin/coverage_note.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/coverage_note.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/evaluate_results_pynguin.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/evaluate_results_pynguin.ipynb


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/coverage_humaneval_3.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/coverage_humaneval_3.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/coverage_humaneval_5.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/coverage_humaneval_5.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/coverage_humaneval_perfect.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/coverage_humaneval_perfect.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/mutation_humaneval.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/mutation_humaneval.sh


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/mutation_humaneval_3.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/mutation_humaneval_3.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/mutation_humaneval_5.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/mutation_humaneval_5.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/output/HumanEval/mutation_humaneval_perfect.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/HumanEval/mutation_humaneval_perfect.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/coverage_mbpp_3.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/coverage_mbpp_3.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/coverage_mbpp_5.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/coverage_mbpp_5.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/coverage_mbpp_perfect.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/coverage_mbpp_perfect.json


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/mutation_mbpp.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/mutation_mbpp.sh


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/mutation_mbpp_3.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/mutation_mbpp_3.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/mutation_mbpp_5.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/mutation_mbpp_5.txt


--------------------------------------------------------------------------------
/baselines/Pynguin/output/MBPP/mutation_mbpp_perfect.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/Pynguin/output/MBPP/mutation_mbpp_perfect.txt


--------------------------------------------------------------------------------
/baselines/StarCoder/StarCoder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/StarCoder.py


--------------------------------------------------------------------------------
/baselines/StarCoder/output/APPS/prediction_from_file.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/APPS/prediction_from_file.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/APPS/starcoder_apps_testcase_beam_executable.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/APPS/starcoder_apps_testcase_beam_executable.json


--------------------------------------------------------------------------------
/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/HumanEval/starcoder_humaneval_testcase_beam_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/HumanEval/starcoder_humaneval_testcase_beam_full.json


--------------------------------------------------------------------------------
/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/baselines/StarCoder/output/MBPP/starcoder_mbpp_testcase_beam_full.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/baselines/StarCoder/output/MBPP/starcoder_mbpp_testcase_beam_full.json


--------------------------------------------------------------------------------
/datasets/HumanEval/humaneval_test.csv:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/datasets/HumanEval/humaneval_test.csv


--------------------------------------------------------------------------------
/datasets/MBPP/mbpp_test.csv:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/datasets/MBPP/mbpp_test.csv


--------------------------------------------------------------------------------
/evaluation.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/evaluation.py


--------------------------------------------------------------------------------
/finetuning.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/finetuning.py


--------------------------------------------------------------------------------
/handlers/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/handlers/code_processing.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/code_processing.py


--------------------------------------------------------------------------------
/handlers/literals.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/literals.json


--------------------------------------------------------------------------------
/handlers/python_terminal_command.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/python_terminal_command.py


--------------------------------------------------------------------------------
/handlers/testing_util.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/testing_util.py


--------------------------------------------------------------------------------
/handlers/testing_util_v2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/testing_util_v2.py


--------------------------------------------------------------------------------
/handlers/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/handlers/utils.py


--------------------------------------------------------------------------------
/inference.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/inference.py


--------------------------------------------------------------------------------
/ppo_training.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/ppo_training.py


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/requirements.txt


--------------------------------------------------------------------------------
/results/APPS/prediction-5_beam300.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/APPS/prediction-5_beam300.pkl


--------------------------------------------------------------------------------
/results/APPS/prediction.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/APPS/prediction.log


--------------------------------------------------------------------------------
/results/APPS/prediction_from_file.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/APPS/prediction_from_file.log


--------------------------------------------------------------------------------
/results/HumanEval/prediction-5_beam300_full.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/HumanEval/prediction-5_beam300_full.pkl


--------------------------------------------------------------------------------
/results/HumanEval/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/HumanEval/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/results/HumanEval/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/HumanEval/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/results/HumanEval/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/HumanEval/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------
/results/MBPP/prediction-5_beam300_full.pkl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/MBPP/prediction-5_beam300_full.pkl


--------------------------------------------------------------------------------
/results/MBPP/prediction_from_file_rank0_multi0.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/MBPP/prediction_from_file_rank0_multi0.log


--------------------------------------------------------------------------------
/results/MBPP/prediction_from_file_rank0_single3.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/MBPP/prediction_from_file_rank0_single3.log


--------------------------------------------------------------------------------
/results/MBPP/prediction_from_file_rank0_single5.log:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/awsm-research/pytester/HEAD/results/MBPP/prediction_from_file_rank0_single5.log


--------------------------------------------------------------------------------