├── .gitignore ├── LICENSE ├── MANIFEST.in ├── README.md ├── bytes32 ├── __init__.py ├── alignment.py ├── compliance.py ├── utils.py ├── validity.py ├── version.py └── winnability │ ├── __init__.py │ ├── example.txt │ └── language_agent.py ├── data ├── action_test.csv ├── action_train.csv ├── distractor_test.csv ├── distractor_train.csv ├── experiment_action.csv ├── experiment_distractor.csv ├── experiment_object.csv ├── object_test.csv ├── object_train.csv ├── playthroughs │ ├── balance-scale-heaviest-playthrough.txt │ ├── balance-scale-weigh-playthrough.txt │ ├── bath-tub-water-temperature-playthrough.txt │ ├── bird-life-cycle-playthrough.txt │ ├── blood-type-playthrough.txt │ ├── boil-water-playthrough.txt │ ├── clean-energy-playthrough.txt │ ├── conductivity-playthrough.txt │ ├── cooking-playthrough.txt │ ├── dishwasher-playthrough.txt │ ├── forge-key-playthrough.txt │ ├── hang-painting-playthrough.txt │ ├── inclined-plane-playthrough.txt │ ├── lit-light-bulb-playthrough.txt │ ├── make-campfire-playthrough.txt │ ├── make-ice-cubes-playthrough.txt │ ├── metal-detector-playthrough.txt │ ├── mix-paint-playthrough.txt │ ├── multimeter-playthrough.txt │ ├── plant-tree-playthrough.txt │ ├── refrigerate-food-playthrough.txt │ ├── scale-weigh-playthrough.txt │ ├── space-walk-playthrough.txt │ ├── sunburn-playthrough.txt │ ├── sweep-floor-playthrough.txt │ ├── take-photo-playthrough.txt │ ├── thermometer-playthrough.txt │ ├── use-bandage-playthrough.txt │ ├── volume-container-playthrough.txt │ ├── volume-playthrough.txt │ ├── volume-stone-playthrough.txt │ └── wash-clothes-playthrough.txt ├── programs │ ├── balance-scale-heaviest.py │ ├── balance-scale-weigh.py │ ├── bath-tub-water-temperature.py │ ├── bird-life-cycle.py │ ├── blood-type.py │ ├── boil-water.py │ ├── clean-energy.py │ ├── conductivity.py │ ├── cooking.py │ ├── dishwasher-reductionattempt1.py │ ├── dishwasher.py │ ├── forge-key.py │ ├── hang-painting.py │ ├── inclined-plane.py │ ├── lit-lightbulb.py │ ├── make-campfire.py │ ├── make-ice-cubes.py │ ├── metal-detector.py │ ├── mix-paint.py │ ├── multimeter.py │ ├── plant-tree.py │ ├── refrigerate-food.py │ ├── scale-weigh.py │ ├── space-walk.py │ ├── sunburn.py │ ├── sweep-floor.py │ ├── take-photo.py │ ├── thermometer.py │ ├── use-bandage.py │ ├── volume-container.py │ ├── volume-stone.py │ ├── volume.py │ └── wash-clothes.py ├── test_eval.csv └── test_prompts │ ├── test_1.py │ ├── test_10.py │ ├── test_11.py │ ├── test_12.py │ ├── test_13.py │ ├── test_14.py │ ├── test_15.py │ ├── test_16.py │ ├── test_2.py │ ├── test_3.py │ ├── test_4.py │ ├── test_5.py │ ├── test_6.py │ ├── test_7.py │ ├── test_8.py │ └── test_9.py ├── requirements.txt ├── results ├── 2023-10-20 │ └── generated_games │ │ ├── output_CodeLlama-34b-Instruct-hf_CodeLlama-34b-Instruct-hf │ │ ├── 20231020_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_generation.py │ │ ├── 20231020_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_generation.txt │ │ ├── 20231020_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_prompt_out.txt │ │ ├── 20231020_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_generation.py │ │ ├── 20231020_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_generation.txt │ │ ├── 20231020_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_prompt_out.txt │ │ ├── 20231020_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231020_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231020_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231020_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation.py │ │ ├── 20231020_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation.txt │ │ ├── 20231020_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_prompt_out.txt │ │ ├── 20231020_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231020_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231020_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231020_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation.py │ │ ├── 20231020_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation.txt │ │ ├── 20231020_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_prompt_out.txt │ │ ├── 20231020_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231020_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231020_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231020_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation.py │ │ ├── 20231020_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation.txt │ │ ├── 20231020_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_prompt_out.txt │ │ ├── 20231020_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231020_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231020_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231020_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.py │ │ ├── 20231020_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.txt │ │ ├── 20231020_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_prompt_out.txt │ │ ├── 20231020_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.py │ │ ├── 20231020_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.txt │ │ ├── 20231020_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_prompt_out.txt │ │ ├── 20231020_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231020_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231020_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231020_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231020_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231020_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231020_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231020_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231020_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231020_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231020_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231020_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.py │ │ ├── 20231020_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ ├── 20231020_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231020_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231020_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation.py │ │ ├── 20231020_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_prompt_out.txt │ │ ├── 20231020_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231020_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231020_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation.py │ │ ├── 20231020_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_prompt_out.txt │ │ ├── 20231020_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation.py │ │ ├── 20231020_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_prompt_out.txt │ │ ├── 20231020_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation.py │ │ ├── 20231020_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_prompt_out.txt │ │ ├── 20231020_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation.py │ │ ├── 20231020_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_prompt_out.txt │ │ ├── 20231020_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231020_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231020_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation.py │ │ ├── 20231020_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_prompt_out.txt │ │ ├── 20231020_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation.py │ │ ├── 20231020_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_prompt_out.txt │ │ ├── 20231020_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation.py │ │ ├── 20231020_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation.txt │ │ ├── 20231020_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_prompt_out.txt │ │ ├── 20231020_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231020_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231020_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231020_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.py │ │ ├── 20231020_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.txt │ │ ├── 20231020_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_prompt_out.txt │ │ ├── 20231020_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231020_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231020_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231020_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231020_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231020_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231020_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231020_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231020_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ └── 20231022_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ └── output_CodeLlama-34b-Instruct-meta │ │ ├── _action_test_10_n_CodeLlama-34b-Instruct_blood-type_generation.py │ │ ├── _action_test_10_n_CodeLlama-34b-Instruct_blood-type_prompt_out.txt │ │ ├── _action_test_10_p_CodeLlama-34b-Instruct_thermometer_generation.py │ │ ├── _action_test_10_p_CodeLlama-34b-Instruct_thermometer_prompt_out.txt │ │ ├── _action_test_11_n_CodeLlama-34b-Instruct_multimeter_generation.py │ │ ├── _action_test_11_n_CodeLlama-34b-Instruct_multimeter_prompt_out.txt │ │ ├── _action_test_11_p_CodeLlama-34b-Instruct_mix-paint_generation.py │ │ ├── _action_test_11_p_CodeLlama-34b-Instruct_mix-paint_prompt_out.txt │ │ ├── _action_test_12_n_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _action_test_12_n_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _action_test_12_p_CodeLlama-34b-Instruct_boil-water_generation.py │ │ ├── _action_test_12_p_CodeLlama-34b-Instruct_boil-water_prompt_out.txt │ │ ├── _action_test_13_n_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _action_test_13_n_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _action_test_13_p_CodeLlama-34b-Instruct_cooking_generation.py │ │ ├── _action_test_13_p_CodeLlama-34b-Instruct_cooking_prompt_out.txt │ │ ├── _action_test_14_n_CodeLlama-34b-Instruct_multimeter_generation.py │ │ ├── _action_test_14_n_CodeLlama-34b-Instruct_multimeter_prompt_out.txt │ │ ├── _action_test_14_p_CodeLlama-34b-Instruct_metal-detector_generation.py │ │ ├── _action_test_14_p_CodeLlama-34b-Instruct_metal-detector_prompt_out.txt │ │ ├── _action_test_15_n_CodeLlama-34b-Instruct_refrigerate-food_generation.py │ │ ├── _action_test_15_n_CodeLlama-34b-Instruct_refrigerate-food_prompt_out.txt │ │ ├── _action_test_15_p_CodeLlama-34b-Instruct_space-walk_generation.py │ │ ├── _action_test_15_p_CodeLlama-34b-Instruct_space-walk_prompt_out.txt │ │ ├── _action_test_16_n_CodeLlama-34b-Instruct_space-walk_generation.py │ │ ├── _action_test_16_n_CodeLlama-34b-Instruct_space-walk_prompt_out.txt │ │ ├── _action_test_16_p_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _action_test_16_p_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _action_test_1_n_CodeLlama-34b-Instruct_multimeter_generation.py │ │ ├── _action_test_1_n_CodeLlama-34b-Instruct_multimeter_prompt_out.txt │ │ ├── _action_test_1_p_CodeLlama-34b-Instruct_make-ice-cubes_generation.py │ │ ├── _action_test_1_p_CodeLlama-34b-Instruct_make-ice-cubes_prompt_out.txt │ │ ├── _action_test_2_n_CodeLlama-34b-Instruct_multimeter_generation.py │ │ ├── _action_test_2_n_CodeLlama-34b-Instruct_multimeter_prompt_out.txt │ │ ├── _action_test_2_p_CodeLlama-34b-Instruct_forge-key_generation.py │ │ ├── _action_test_2_p_CodeLlama-34b-Instruct_forge-key_prompt_out.txt │ │ ├── _action_test_3_n_CodeLlama-34b-Instruct_volume_generation.py │ │ ├── _action_test_3_n_CodeLlama-34b-Instruct_volume_prompt_out.txt │ │ ├── _action_test_3_p_CodeLlama-34b-Instruct_take-photo_generation.py │ │ ├── _action_test_3_p_CodeLlama-34b-Instruct_take-photo_prompt_out.txt │ │ ├── _action_test_4_n_CodeLlama-34b-Instruct_balance-scale-heaviest_generation.py │ │ ├── _action_test_4_n_CodeLlama-34b-Instruct_balance-scale-heaviest_prompt_out.txt │ │ ├── _action_test_4_p_CodeLlama-34b-Instruct_cooking_generation.py │ │ ├── _action_test_4_p_CodeLlama-34b-Instruct_cooking_prompt_out.txt │ │ ├── _action_test_5_n_CodeLlama-34b-Instruct_sweep-floor_generation.py │ │ ├── _action_test_5_n_CodeLlama-34b-Instruct_sweep-floor_prompt_out.txt │ │ ├── _action_test_5_p_CodeLlama-34b-Instruct_dishwasher_generation.py │ │ ├── _action_test_5_p_CodeLlama-34b-Instruct_dishwasher_prompt_out.txt │ │ ├── _action_test_6_n_CodeLlama-34b-Instruct_wash-clothes_generation.py │ │ ├── _action_test_6_n_CodeLlama-34b-Instruct_wash-clothes_prompt_out.txt │ │ ├── _action_test_6_p_CodeLlama-34b-Instruct_conductivity_generation.py │ │ ├── _action_test_6_p_CodeLlama-34b-Instruct_conductivity_prompt_out.txt │ │ ├── _action_test_7_n_CodeLlama-34b-Instruct_volume-container_generation.py │ │ ├── _action_test_7_n_CodeLlama-34b-Instruct_volume-container_prompt_out.txt │ │ ├── _action_test_7_p_CodeLlama-34b-Instruct_dishwasher_generation.py │ │ ├── _action_test_7_p_CodeLlama-34b-Instruct_dishwasher_prompt_out.txt │ │ ├── _action_test_8_n_CodeLlama-34b-Instruct_plant-tree_generation.py │ │ ├── _action_test_8_n_CodeLlama-34b-Instruct_plant-tree_prompt_out.txt │ │ ├── _action_test_8_p_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _action_test_8_p_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _action_test_9_n_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _action_test_9_n_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _action_test_9_p_CodeLlama-34b-Instruct_volume_generation.py │ │ ├── _action_test_9_p_CodeLlama-34b-Instruct_volume_prompt_out.txt │ │ ├── _distractor_test_10_n_CodeLlama-34b-Instruct_balance-scale-heaviest_generation.py │ │ ├── _distractor_test_10_n_CodeLlama-34b-Instruct_balance-scale-heaviest_prompt_out.txt │ │ ├── _distractor_test_10_p_CodeLlama-34b-Instruct_make-campfire_generation.py │ │ ├── _distractor_test_10_p_CodeLlama-34b-Instruct_make-campfire_prompt_out.txt │ │ ├── _distractor_test_11_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _distractor_test_11_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _distractor_test_11_p_CodeLlama-34b-Instruct_sweep-floor_generation.py │ │ ├── _distractor_test_11_p_CodeLlama-34b-Instruct_sweep-floor_prompt_out.txt │ │ ├── _distractor_test_12_n_CodeLlama-34b-Instruct_space-walk_generation.py │ │ ├── _distractor_test_12_n_CodeLlama-34b-Instruct_space-walk_prompt_out.txt │ │ ├── _distractor_test_12_p_CodeLlama-34b-Instruct_volume_generation.py │ │ ├── _distractor_test_12_p_CodeLlama-34b-Instruct_volume_prompt_out.txt │ │ ├── _distractor_test_13_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _distractor_test_13_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _distractor_test_13_p_CodeLlama-34b-Instruct_multimeter_generation.py │ │ ├── _distractor_test_13_p_CodeLlama-34b-Instruct_multimeter_prompt_out.txt │ │ ├── _distractor_test_14_n_CodeLlama-34b-Instruct_volume-stone_generation.py │ │ ├── _distractor_test_14_n_CodeLlama-34b-Instruct_volume-stone_prompt_out.txt │ │ ├── _distractor_test_14_p_CodeLlama-34b-Instruct_balance-scale-weigh_generation.py │ │ ├── _distractor_test_14_p_CodeLlama-34b-Instruct_balance-scale-weigh_prompt_out.txt │ │ ├── _distractor_test_15_n_CodeLlama-34b-Instruct_space-walk_generation.py │ │ ├── _distractor_test_15_n_CodeLlama-34b-Instruct_space-walk_prompt_out.txt │ │ ├── _distractor_test_15_p_CodeLlama-34b-Instruct_dishwasher_generation.py │ │ ├── _distractor_test_15_p_CodeLlama-34b-Instruct_dishwasher_prompt_out.txt │ │ ├── _distractor_test_16_n_CodeLlama-34b-Instruct_lit-lightbulb_generation.py │ │ ├── _distractor_test_16_n_CodeLlama-34b-Instruct_lit-lightbulb_prompt_out.txt │ │ ├── _distractor_test_16_p_CodeLlama-34b-Instruct_plant-tree_generation.py │ │ ├── _distractor_test_16_p_CodeLlama-34b-Instruct_plant-tree_prompt_out.txt │ │ ├── _distractor_test_1_n_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _distractor_test_1_n_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _distractor_test_1_p_CodeLlama-34b-Instruct_bird-life-cycle_generation.py │ │ ├── _distractor_test_1_p_CodeLlama-34b-Instruct_bird-life-cycle_prompt_out.txt │ │ ├── _distractor_test_2_n_CodeLlama-34b-Instruct_lit-lightbulb_generation.py │ │ ├── _distractor_test_2_n_CodeLlama-34b-Instruct_lit-lightbulb_prompt_out.txt │ │ ├── _distractor_test_2_p_CodeLlama-34b-Instruct_make-ice-cubes_generation.py │ │ ├── _distractor_test_2_p_CodeLlama-34b-Instruct_make-ice-cubes_prompt_out.txt │ │ ├── _distractor_test_3_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _distractor_test_3_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _distractor_test_3_p_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _distractor_test_3_p_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _distractor_test_4_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _distractor_test_4_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _distractor_test_4_p_CodeLlama-34b-Instruct_metal-detector_generation.py │ │ ├── _distractor_test_4_p_CodeLlama-34b-Instruct_metal-detector_prompt_out.txt │ │ ├── _distractor_test_5_n_CodeLlama-34b-Instruct_lit-lightbulb_generation.py │ │ ├── _distractor_test_5_n_CodeLlama-34b-Instruct_lit-lightbulb_prompt_out.txt │ │ ├── _distractor_test_5_p_CodeLlama-34b-Instruct_make-ice-cubes_generation.py │ │ ├── _distractor_test_5_p_CodeLlama-34b-Instruct_make-ice-cubes_prompt_out.txt │ │ ├── _distractor_test_6_n_CodeLlama-34b-Instruct_clean-energy_generation.py │ │ ├── _distractor_test_6_n_CodeLlama-34b-Instruct_clean-energy_prompt_out.txt │ │ ├── _distractor_test_6_p_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _distractor_test_6_p_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _distractor_test_7_n_CodeLlama-34b-Instruct_clean-energy_generation.py │ │ ├── _distractor_test_7_n_CodeLlama-34b-Instruct_clean-energy_prompt_out.txt │ │ ├── _distractor_test_7_p_CodeLlama-34b-Instruct_refrigerate-food_generation.py │ │ ├── _distractor_test_7_p_CodeLlama-34b-Instruct_refrigerate-food_prompt_out.txt │ │ ├── _distractor_test_8_n_CodeLlama-34b-Instruct_conductivity_generation.py │ │ ├── _distractor_test_8_n_CodeLlama-34b-Instruct_conductivity_prompt_out.txt │ │ ├── _distractor_test_8_p_CodeLlama-34b-Instruct_dishwasher_generation.py │ │ ├── _distractor_test_8_p_CodeLlama-34b-Instruct_dishwasher_prompt_out.txt │ │ ├── _distractor_test_9_n_CodeLlama-34b-Instruct_volume-stone_generation.py │ │ ├── _distractor_test_9_n_CodeLlama-34b-Instruct_volume-stone_prompt_out.txt │ │ ├── _distractor_test_9_p_CodeLlama-34b-Instruct_cooking_generation.py │ │ ├── _distractor_test_9_p_CodeLlama-34b-Instruct_cooking_prompt_out.txt │ │ ├── _object_test_10_n_CodeLlama-34b-Instruct_metal-detector_generation.py │ │ ├── _object_test_10_n_CodeLlama-34b-Instruct_metal-detector_prompt_out.txt │ │ ├── _object_test_10_p_CodeLlama-34b-Instruct_make-ice-cubes_generation.py │ │ ├── _object_test_10_p_CodeLlama-34b-Instruct_make-ice-cubes_prompt_out.txt │ │ ├── _object_test_11_n_CodeLlama-34b-Instruct_inclined-plane_generation.py │ │ ├── _object_test_11_n_CodeLlama-34b-Instruct_inclined-plane_prompt_out.txt │ │ ├── _object_test_11_p_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _object_test_11_p_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _object_test_12_n_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _object_test_12_n_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _object_test_12_p_CodeLlama-34b-Instruct_dishwasher_generation.py │ │ ├── _object_test_12_p_CodeLlama-34b-Instruct_dishwasher_prompt_out.txt │ │ ├── _object_test_13_n_CodeLlama-34b-Instruct_scale-weigh_generation.py │ │ ├── _object_test_13_n_CodeLlama-34b-Instruct_scale-weigh_prompt_out.txt │ │ ├── _object_test_13_p_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _object_test_13_p_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _object_test_14_n_CodeLlama-34b-Instruct_balance-scale-weigh_generation.py │ │ ├── _object_test_14_n_CodeLlama-34b-Instruct_balance-scale-weigh_prompt_out.txt │ │ ├── _object_test_14_p_CodeLlama-34b-Instruct_sweep-floor_generation.py │ │ ├── _object_test_14_p_CodeLlama-34b-Instruct_sweep-floor_prompt_out.txt │ │ ├── _object_test_15_n_CodeLlama-34b-Instruct_volume_generation.py │ │ ├── _object_test_15_n_CodeLlama-34b-Instruct_volume_prompt_out.txt │ │ ├── _object_test_15_p_CodeLlama-34b-Instruct_space-walk_generation.py │ │ ├── _object_test_15_p_CodeLlama-34b-Instruct_space-walk_prompt_out.txt │ │ ├── _object_test_16_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _object_test_16_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _object_test_16_p_CodeLlama-34b-Instruct_balance-scale-weigh_generation.py │ │ ├── _object_test_16_p_CodeLlama-34b-Instruct_balance-scale-weigh_prompt_out.txt │ │ ├── _object_test_1_n_CodeLlama-34b-Instruct_plant-tree_generation.py │ │ ├── _object_test_1_n_CodeLlama-34b-Instruct_plant-tree_prompt_out.txt │ │ ├── _object_test_1_p_CodeLlama-34b-Instruct_refrigerate-food_generation.py │ │ ├── _object_test_1_p_CodeLlama-34b-Instruct_refrigerate-food_prompt_out.txt │ │ ├── _object_test_2_n_CodeLlama-34b-Instruct_take-photo_generation.py │ │ ├── _object_test_2_n_CodeLlama-34b-Instruct_take-photo_prompt_out.txt │ │ ├── _object_test_2_p_CodeLlama-34b-Instruct_volume-stone_generation.py │ │ ├── _object_test_2_p_CodeLlama-34b-Instruct_volume-stone_prompt_out.txt │ │ ├── _object_test_3_n_CodeLlama-34b-Instruct_balance-scale-weigh_generation.py │ │ ├── _object_test_3_n_CodeLlama-34b-Instruct_balance-scale-weigh_prompt_out.txt │ │ ├── _object_test_3_p_CodeLlama-34b-Instruct_wash-clothes_generation.py │ │ ├── _object_test_3_p_CodeLlama-34b-Instruct_wash-clothes_prompt_out.txt │ │ ├── _object_test_4_n_CodeLlama-34b-Instruct_make-campfire_generation.py │ │ ├── _object_test_4_n_CodeLlama-34b-Instruct_make-campfire_prompt_out.txt │ │ ├── _object_test_4_p_CodeLlama-34b-Instruct_metal-detector_generation.py │ │ ├── _object_test_4_p_CodeLlama-34b-Instruct_metal-detector_prompt_out.txt │ │ ├── _object_test_5_n_CodeLlama-34b-Instruct_clean-energy_generation.py │ │ ├── _object_test_5_n_CodeLlama-34b-Instruct_clean-energy_prompt_out.txt │ │ ├── _object_test_5_p_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py │ │ ├── _object_test_5_p_CodeLlama-34b-Instruct_bath-tub-water-temperature_prompt_out.txt │ │ ├── _object_test_6_n_CodeLlama-34b-Instruct_bird-life-cycle_generation.py │ │ ├── _object_test_6_n_CodeLlama-34b-Instruct_bird-life-cycle_prompt_out.txt │ │ ├── _object_test_6_p_CodeLlama-34b-Instruct_conductivity_generation.py │ │ ├── _object_test_6_p_CodeLlama-34b-Instruct_conductivity_prompt_out.txt │ │ ├── _object_test_7_n_CodeLlama-34b-Instruct_hang-painting_generation.py │ │ ├── _object_test_7_n_CodeLlama-34b-Instruct_hang-painting_prompt_out.txt │ │ ├── _object_test_7_p_CodeLlama-34b-Instruct_boil-water_generation.py │ │ ├── _object_test_7_p_CodeLlama-34b-Instruct_boil-water_prompt_out.txt │ │ ├── _object_test_8_n_CodeLlama-34b-Instruct_volume_generation.py │ │ ├── _object_test_8_n_CodeLlama-34b-Instruct_volume_prompt_out.txt │ │ ├── _object_test_8_p_CodeLlama-34b-Instruct_sunburn_generation.py │ │ ├── _object_test_8_p_CodeLlama-34b-Instruct_sunburn_prompt_out.txt │ │ ├── _object_test_9_n_CodeLlama-34b-Instruct_lit-lightbulb_generation.py │ │ ├── _object_test_9_n_CodeLlama-34b-Instruct_lit-lightbulb_prompt_out.txt │ │ ├── _object_test_9_p_CodeLlama-34b-Instruct_volume_generation.py │ │ └── _object_test_9_p_CodeLlama-34b-Instruct_volume_prompt_out.txt ├── CodeLlama-34b-Instruct │ ├── generated_games │ │ ├── 20231010_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_generation.py │ │ ├── 20231010_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_generation.txt │ │ ├── 20231010_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_prompt_out.txt │ │ ├── 20231010_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_generation.py │ │ ├── 20231010_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_generation.txt │ │ ├── 20231010_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_prompt_out.txt │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231010_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation.py │ │ ├── 20231010_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation.txt │ │ ├── 20231010_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_prompt_out.txt │ │ ├── 20231010_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation.py │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation.txt │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_prompt_out.txt │ │ ├── 20231010_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation.py │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation.txt │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_prompt_out.txt │ │ ├── 20231010_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231010_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231010_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231010_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.py │ │ ├── 20231010_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.txt │ │ ├── 20231010_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_prompt_out.txt │ │ ├── 20231010_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.py │ │ ├── 20231010_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.txt │ │ ├── 20231010_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_prompt_out.txt │ │ ├── 20231010_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231010_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231010_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231010_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231010_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231010_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.py │ │ ├── 20231010_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.txt │ │ ├── 20231010_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ ├── 20231010_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231010_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231010_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation.py │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation.txt │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_prompt_out.txt │ │ ├── 20231010_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231010_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation.py │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation.txt │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_prompt_out.txt │ │ ├── 20231010_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation.py │ │ ├── 20231010_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation.txt │ │ ├── 20231010_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_prompt_out.txt │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation.py │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation.txt │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_prompt_out.txt │ │ ├── 20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation.py │ │ ├── 20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation.txt │ │ ├── 20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_prompt_out.txt │ │ ├── 20231010_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231010_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231010_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation.py │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation.txt │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_prompt_out.txt │ │ ├── 20231010_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation.py │ │ ├── 20231010_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation.txt │ │ ├── 20231010_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_prompt_out.txt │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation.py │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation.txt │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_prompt_out.txt │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.py │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.txt │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_prompt_out.txt │ │ ├── 20231010_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231010_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation.py │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation.txt │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_prompt_out.txt │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation.py │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation.txt │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_prompt_out.txt │ │ ├── 20231010_distractor_test_11_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_distractor_test_11_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_distractor_test_11_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation.py │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation.txt │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_prompt_out.txt │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_distractor_test_13_p_CodeLlama-34b-Instruct-hf_multimeter_generation.py │ │ ├── 20231010_distractor_test_13_p_CodeLlama-34b-Instruct-hf_multimeter_generation.txt │ │ ├── 20231010_distractor_test_13_p_CodeLlama-34b-Instruct-hf_multimeter_prompt_out.txt │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_generation.py │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_generation.txt │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_prompt_out.txt │ │ ├── 20231010_distractor_test_14_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.py │ │ ├── 20231010_distractor_test_14_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.txt │ │ ├── 20231010_distractor_test_14_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_prompt_out.txt │ │ ├── 20231010_distractor_test_15_n_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231010_distractor_test_15_n_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231010_distractor_test_15_n_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231010_distractor_test_15_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231010_distractor_test_15_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231010_distractor_test_15_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231010_distractor_test_16_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.py │ │ ├── 20231010_distractor_test_16_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.txt │ │ ├── 20231010_distractor_test_16_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_prompt_out.txt │ │ ├── 20231010_distractor_test_16_p_CodeLlama-34b-Instruct-hf_plant-tree_generation.py │ │ ├── 20231010_distractor_test_16_p_CodeLlama-34b-Instruct-hf_plant-tree_generation.txt │ │ ├── 20231010_distractor_test_16_p_CodeLlama-34b-Instruct-hf_plant-tree_prompt_out.txt │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_distractor_test_1_p_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation.py │ │ ├── 20231010_distractor_test_1_p_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation.txt │ │ ├── 20231010_distractor_test_1_p_CodeLlama-34b-Instruct-hf_bird-life-cycle_prompt_out.txt │ │ ├── 20231010_distractor_test_2_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.py │ │ ├── 20231010_distractor_test_2_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.txt │ │ ├── 20231010_distractor_test_2_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_prompt_out.txt │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.py │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.txt │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.py │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.txt │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_prompt_out.txt │ │ ├── 20231010_distractor_test_5_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.py │ │ ├── 20231010_distractor_test_5_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.txt │ │ ├── 20231010_distractor_test_5_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_prompt_out.txt │ │ ├── 20231010_distractor_test_5_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.py │ │ ├── 20231010_distractor_test_5_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.txt │ │ ├── 20231010_distractor_test_5_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ ├── 20231010_distractor_test_6_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.py │ │ ├── 20231010_distractor_test_6_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.txt │ │ ├── 20231010_distractor_test_6_n_CodeLlama-34b-Instruct-hf_clean-energy_prompt_out.txt │ │ ├── 20231010_distractor_test_6_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_distractor_test_6_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_distractor_test_6_p_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_distractor_test_7_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.py │ │ ├── 20231010_distractor_test_7_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.txt │ │ ├── 20231010_distractor_test_7_n_CodeLlama-34b-Instruct-hf_clean-energy_prompt_out.txt │ │ ├── 20231010_distractor_test_7_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.py │ │ ├── 20231010_distractor_test_7_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.txt │ │ ├── 20231010_distractor_test_7_p_CodeLlama-34b-Instruct-hf_refrigerate-food_prompt_out.txt │ │ ├── 20231010_distractor_test_8_n_CodeLlama-34b-Instruct-hf_conductivity_generation.py │ │ ├── 20231010_distractor_test_8_n_CodeLlama-34b-Instruct-hf_conductivity_generation.txt │ │ ├── 20231010_distractor_test_8_n_CodeLlama-34b-Instruct-hf_conductivity_prompt_out.txt │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231010_distractor_test_9_n_CodeLlama-34b-Instruct-hf_volume-stone_generation.py │ │ ├── 20231010_distractor_test_9_n_CodeLlama-34b-Instruct-hf_volume-stone_generation.txt │ │ ├── 20231010_distractor_test_9_n_CodeLlama-34b-Instruct-hf_volume-stone_prompt_out.txt │ │ ├── 20231010_distractor_test_9_p_CodeLlama-34b-Instruct-hf_cooking_generation.py │ │ ├── 20231010_distractor_test_9_p_CodeLlama-34b-Instruct-hf_cooking_generation.txt │ │ ├── 20231010_distractor_test_9_p_CodeLlama-34b-Instruct-hf_cooking_prompt_out.txt │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_generation.py │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_generation.txt │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_prompt_out.txt │ │ ├── 20231010_object_test_10_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.py │ │ ├── 20231010_object_test_10_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation.txt │ │ ├── 20231010_object_test_10_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_prompt_out.txt │ │ ├── 20231010_object_test_11_n_CodeLlama-34b-Instruct-hf_inclined-plane_generation.py │ │ ├── 20231010_object_test_11_n_CodeLlama-34b-Instruct-hf_inclined-plane_generation.txt │ │ ├── 20231010_object_test_11_n_CodeLlama-34b-Instruct-hf_inclined-plane_prompt_out.txt │ │ ├── 20231010_object_test_11_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_object_test_11_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_object_test_11_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_object_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_object_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_object_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_object_test_12_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.py │ │ ├── 20231010_object_test_12_p_CodeLlama-34b-Instruct-hf_dishwasher_generation.txt │ │ ├── 20231010_object_test_12_p_CodeLlama-34b-Instruct-hf_dishwasher_prompt_out.txt │ │ ├── 20231010_object_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.py │ │ ├── 20231010_object_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation.txt │ │ ├── 20231010_object_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_prompt_out.txt │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_object_test_14_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.py │ │ ├── 20231010_object_test_14_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.txt │ │ ├── 20231010_object_test_14_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_prompt_out.txt │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation.py │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation.txt │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_prompt_out.txt │ │ ├── 20231010_object_test_15_n_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_object_test_15_n_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231010_object_test_15_n_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231010_object_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.py │ │ ├── 20231010_object_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation.txt │ │ ├── 20231010_object_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_prompt_out.txt │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_object_test_16_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.py │ │ ├── 20231010_object_test_16_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.txt │ │ ├── 20231010_object_test_16_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_prompt_out.txt │ │ ├── 20231010_object_test_1_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.py │ │ ├── 20231010_object_test_1_n_CodeLlama-34b-Instruct-hf_plant-tree_generation.txt │ │ ├── 20231010_object_test_1_n_CodeLlama-34b-Instruct-hf_plant-tree_prompt_out.txt │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.py │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation.txt │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_prompt_out.txt │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation.py │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation.txt │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_prompt_out.txt │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_generation.py │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_generation.txt │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_prompt_out.txt │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.py │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation.txt │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_prompt_out.txt │ │ ├── 20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_generation.py │ │ ├── 20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_generation.txt │ │ ├── 20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_prompt_out.txt │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_generation.py │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_generation.txt │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_prompt_out.txt │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.py │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation.txt │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_prompt_out.txt │ │ ├── 20231010_object_test_5_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.py │ │ ├── 20231010_object_test_5_n_CodeLlama-34b-Instruct-hf_clean-energy_generation.txt │ │ ├── 20231010_object_test_5_n_CodeLlama-34b-Instruct-hf_clean-energy_prompt_out.txt │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.py │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation.txt │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_prompt_out.txt │ │ ├── 20231010_object_test_6_n_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation.py │ │ ├── 20231010_object_test_6_n_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation.txt │ │ ├── 20231010_object_test_6_n_CodeLlama-34b-Instruct-hf_bird-life-cycle_prompt_out.txt │ │ ├── 20231010_object_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation.py │ │ ├── 20231010_object_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation.txt │ │ ├── 20231010_object_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_prompt_out.txt │ │ ├── 20231010_object_test_7_n_CodeLlama-34b-Instruct-hf_hang-painting_generation.py │ │ ├── 20231010_object_test_7_n_CodeLlama-34b-Instruct-hf_hang-painting_generation.txt │ │ ├── 20231010_object_test_7_n_CodeLlama-34b-Instruct-hf_hang-painting_prompt_out.txt │ │ ├── 20231010_object_test_7_p_CodeLlama-34b-Instruct-hf_boil-water_generation.py │ │ ├── 20231010_object_test_7_p_CodeLlama-34b-Instruct-hf_boil-water_generation.txt │ │ ├── 20231010_object_test_7_p_CodeLlama-34b-Instruct-hf_boil-water_prompt_out.txt │ │ ├── 20231010_object_test_8_n_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_object_test_8_n_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ ├── 20231010_object_test_8_n_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ │ ├── 20231010_object_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.py │ │ ├── 20231010_object_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation.txt │ │ ├── 20231010_object_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_prompt_out.txt │ │ ├── 20231010_object_test_9_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.py │ │ ├── 20231010_object_test_9_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation.txt │ │ ├── 20231010_object_test_9_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_prompt_out.txt │ │ ├── 20231010_object_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.py │ │ ├── 20231010_object_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation.txt │ │ └── 20231010_object_test_9_p_CodeLlama-34b-Instruct-hf_volume_prompt_out.txt │ ├── results.json │ ├── results_with_revisions.json │ └── revised_games │ │ ├── 20231010_action_test_10_n_CodeLlama-34b-Instruct-hf_blood-type_generation_v0.py │ │ ├── 20231010_action_test_10_p_CodeLlama-34b-Instruct-hf_thermometer_generation_v0.py │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v0.py │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v1.py │ │ ├── 20231010_action_test_11_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v2.py │ │ ├── 20231010_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation_v0.py │ │ ├── 20231010_action_test_11_p_CodeLlama-34b-Instruct-hf_mix-paint_generation_v1.py │ │ ├── 20231010_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_action_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation_v0.py │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation_v1.py │ │ ├── 20231010_action_test_12_p_CodeLlama-34b-Instruct-hf_boil-water_generation_v2.py │ │ ├── 20231010_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_action_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation_v0.py │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation_v1.py │ │ ├── 20231010_action_test_13_p_CodeLlama-34b-Instruct-hf_cooking_generation_v2.py │ │ ├── 20231010_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v0.py │ │ ├── 20231010_action_test_14_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v1.py │ │ ├── 20231010_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v0.py │ │ ├── 20231010_action_test_14_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v1.py │ │ ├── 20231010_action_test_15_n_CodeLlama-34b-Instruct-hf_refrigerate-food_generation_v0.py │ │ ├── 20231010_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation_v0.py │ │ ├── 20231010_action_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation_v1.py │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v0.py │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v1.py │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v2.py │ │ ├── 20231010_action_test_16_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v3.py │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v2.py │ │ ├── 20231010_action_test_16_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v3.py │ │ ├── 20231010_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v0.py │ │ ├── 20231010_action_test_1_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v1.py │ │ ├── 20231010_action_test_1_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v0.py │ │ ├── 20231010_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v0.py │ │ ├── 20231010_action_test_2_n_CodeLlama-34b-Instruct-hf_multimeter_generation_v1.py │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation_v0.py │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation_v1.py │ │ ├── 20231010_action_test_2_p_CodeLlama-34b-Instruct-hf_forge-key_generation_v2.py │ │ ├── 20231010_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_generation_v0.py │ │ ├── 20231010_action_test_3_n_CodeLlama-34b-Instruct-hf_volume_generation_v1.py │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation_v0.py │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation_v1.py │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation_v2.py │ │ ├── 20231010_action_test_3_p_CodeLlama-34b-Instruct-hf_take-photo_generation_v3.py │ │ ├── 20231010_action_test_4_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation_v0.py │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation_v0.py │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation_v1.py │ │ ├── 20231010_action_test_4_p_CodeLlama-34b-Instruct-hf_cooking_generation_v2.py │ │ ├── 20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v0.py │ │ ├── 20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v1.py │ │ ├── 20231010_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v0.py │ │ ├── 20231010_action_test_5_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v1.py │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v0.py │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v1.py │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v2.py │ │ ├── 20231010_action_test_6_n_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v3.py │ │ ├── 20231010_action_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation_v0.py │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation_v0.py │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation_v1.py │ │ ├── 20231010_action_test_7_n_CodeLlama-34b-Instruct-hf_volume-container_generation_v2.py │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v0.py │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v1.py │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v2.py │ │ ├── 20231010_action_test_7_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v3.py │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation_v0.py │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation_v1.py │ │ ├── 20231010_action_test_8_n_CodeLlama-34b-Instruct-hf_plant-tree_generation_v2.py │ │ ├── 20231010_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_action_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_action_test_9_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v2.py │ │ ├── 20231010_action_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation_v0.py │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation_v0.py │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation_v1.py │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation_v2.py │ │ ├── 20231010_distractor_test_10_n_CodeLlama-34b-Instruct-hf_balance-scale-heaviest_generation_v3.py │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation_v0.py │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation_v1.py │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation_v2.py │ │ ├── 20231010_distractor_test_10_p_CodeLlama-34b-Instruct-hf_make-campfire_generation_v3.py │ │ ├── 20231010_distractor_test_11_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v0.py │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v1.py │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v2.py │ │ ├── 20231010_distractor_test_11_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v3.py │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v0.py │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v1.py │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v2.py │ │ ├── 20231010_distractor_test_12_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v3.py │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_generation_v0.py │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_generation_v1.py │ │ ├── 20231010_distractor_test_12_p_CodeLlama-34b-Instruct-hf_volume_generation_v2.py │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v1.py │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v2.py │ │ ├── 20231010_distractor_test_13_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v3.py │ │ ├── 20231010_distractor_test_13_p_CodeLlama-34b-Instruct-hf_multimeter_generation_v0.py │ │ ├── 20231010_distractor_test_13_p_CodeLlama-34b-Instruct-hf_multimeter_generation_v1.py │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_generation_v0.py │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_generation_v1.py │ │ ├── 20231010_distractor_test_14_n_CodeLlama-34b-Instruct-hf_volume-stone_generation_v2.py │ │ ├── 20231010_distractor_test_14_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v0.py │ │ ├── 20231010_distractor_test_14_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v1.py │ │ ├── 20231010_distractor_test_15_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v0.py │ │ ├── 20231010_distractor_test_15_n_CodeLlama-34b-Instruct-hf_space-walk_generation_v1.py │ │ ├── 20231010_distractor_test_15_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v0.py │ │ ├── 20231010_distractor_test_16_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v0.py │ │ ├── 20231010_distractor_test_16_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v1.py │ │ ├── 20231010_distractor_test_16_p_CodeLlama-34b-Instruct-hf_plant-tree_generation_v0.py │ │ ├── 20231010_distractor_test_16_p_CodeLlama-34b-Instruct-hf_plant-tree_generation_v1.py │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v2.py │ │ ├── 20231010_distractor_test_1_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v3.py │ │ ├── 20231010_distractor_test_1_p_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation_v0.py │ │ ├── 20231010_distractor_test_1_p_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation_v1.py │ │ ├── 20231010_distractor_test_2_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v0.py │ │ ├── 20231010_distractor_test_2_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v1.py │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v0.py │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v1.py │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v2.py │ │ ├── 20231010_distractor_test_2_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v3.py │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v1.py │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v2.py │ │ ├── 20231010_distractor_test_3_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v3.py │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v2.py │ │ ├── 20231010_distractor_test_3_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v3.py │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v1.py │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v2.py │ │ ├── 20231010_distractor_test_4_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v3.py │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v0.py │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v1.py │ │ ├── 20231010_distractor_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v2.py │ │ ├── 20231010_distractor_test_5_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v0.py │ │ ├── 20231010_distractor_test_5_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v1.py │ │ ├── 20231010_distractor_test_5_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v0.py │ │ ├── 20231010_distractor_test_6_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v0.py │ │ ├── 20231010_distractor_test_6_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v1.py │ │ ├── 20231010_distractor_test_6_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_distractor_test_6_p_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_distractor_test_7_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v0.py │ │ ├── 20231010_distractor_test_7_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v1.py │ │ ├── 20231010_distractor_test_7_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation_v0.py │ │ ├── 20231010_distractor_test_8_n_CodeLlama-34b-Instruct-hf_conductivity_generation_v0.py │ │ ├── 20231010_distractor_test_8_n_CodeLlama-34b-Instruct-hf_conductivity_generation_v1.py │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v0.py │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v1.py │ │ ├── 20231010_distractor_test_8_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v2.py │ │ ├── 20231010_distractor_test_9_n_CodeLlama-34b-Instruct-hf_volume-stone_generation_v0.py │ │ ├── 20231010_distractor_test_9_n_CodeLlama-34b-Instruct-hf_volume-stone_generation_v1.py │ │ ├── 20231010_distractor_test_9_p_CodeLlama-34b-Instruct-hf_cooking_generation_v0.py │ │ ├── 20231010_distractor_test_9_p_CodeLlama-34b-Instruct-hf_cooking_generation_v1.py │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_generation_v0.py │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_generation_v1.py │ │ ├── 20231010_object_test_10_n_CodeLlama-34b-Instruct-hf_metal-detector_generation_v2.py │ │ ├── 20231010_object_test_10_p_CodeLlama-34b-Instruct-hf_make-ice-cubes_generation_v0.py │ │ ├── 20231010_object_test_11_n_CodeLlama-34b-Instruct-hf_inclined-plane_generation_v0.py │ │ ├── 20231010_object_test_11_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_object_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_object_test_12_n_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_object_test_12_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v0.py │ │ ├── 20231010_object_test_12_p_CodeLlama-34b-Instruct-hf_dishwasher_generation_v1.py │ │ ├── 20231010_object_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v0.py │ │ ├── 20231010_object_test_13_n_CodeLlama-34b-Instruct-hf_scale-weigh_generation_v1.py │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v2.py │ │ ├── 20231010_object_test_13_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v3.py │ │ ├── 20231010_object_test_14_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v0.py │ │ ├── 20231010_object_test_14_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v1.py │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v0.py │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v1.py │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v2.py │ │ ├── 20231010_object_test_14_p_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v3.py │ │ ├── 20231010_object_test_15_n_CodeLlama-34b-Instruct-hf_volume_generation_v0.py │ │ ├── 20231010_object_test_15_n_CodeLlama-34b-Instruct-hf_volume_generation_v1.py │ │ ├── 20231010_object_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation_v0.py │ │ ├── 20231010_object_test_15_p_CodeLlama-34b-Instruct-hf_space-walk_generation_v1.py │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v1.py │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v2.py │ │ ├── 20231010_object_test_16_n_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v3.py │ │ ├── 20231010_object_test_16_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v0.py │ │ ├── 20231010_object_test_16_p_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v1.py │ │ ├── 20231010_object_test_1_n_CodeLlama-34b-Instruct-hf_plant-tree_generation_v0.py │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation_v0.py │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation_v1.py │ │ ├── 20231010_object_test_1_p_CodeLlama-34b-Instruct-hf_refrigerate-food_generation_v2.py │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation_v0.py │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation_v1.py │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation_v2.py │ │ ├── 20231010_object_test_2_n_CodeLlama-34b-Instruct-hf_take-photo_generation_v3.py │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_generation_v0.py │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_generation_v1.py │ │ ├── 20231010_object_test_2_p_CodeLlama-34b-Instruct-hf_volume-stone_generation_v2.py │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v0.py │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v1.py │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v2.py │ │ ├── 20231010_object_test_3_n_CodeLlama-34b-Instruct-hf_balance-scale-weigh_generation_v3.py │ │ ├── 20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v0.py │ │ ├── 20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v1.py │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_generation_v0.py │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_generation_v1.py │ │ ├── 20231010_object_test_4_n_CodeLlama-34b-Instruct-hf_make-campfire_generation_v2.py │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v0.py │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v1.py │ │ ├── 20231010_object_test_4_p_CodeLlama-34b-Instruct-hf_metal-detector_generation_v2.py │ │ ├── 20231010_object_test_5_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v0.py │ │ ├── 20231010_object_test_5_n_CodeLlama-34b-Instruct-hf_clean-energy_generation_v1.py │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v0.py │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v1.py │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v2.py │ │ ├── 20231010_object_test_5_p_CodeLlama-34b-Instruct-hf_bath-tub-water-temperature_generation_v3.py │ │ ├── 20231010_object_test_6_n_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation_v0.py │ │ ├── 20231010_object_test_6_n_CodeLlama-34b-Instruct-hf_bird-life-cycle_generation_v1.py │ │ ├── 20231010_object_test_6_p_CodeLlama-34b-Instruct-hf_conductivity_generation_v0.py │ │ ├── 20231010_object_test_7_n_CodeLlama-34b-Instruct-hf_hang-painting_generation_v0.py │ │ ├── 20231010_object_test_7_p_CodeLlama-34b-Instruct-hf_boil-water_generation_v0.py │ │ ├── 20231010_object_test_8_n_CodeLlama-34b-Instruct-hf_volume_generation_v0.py │ │ ├── 20231010_object_test_8_n_CodeLlama-34b-Instruct-hf_volume_generation_v1.py │ │ ├── 20231010_object_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v0.py │ │ ├── 20231010_object_test_8_p_CodeLlama-34b-Instruct-hf_sunburn_generation_v1.py │ │ ├── 20231010_object_test_9_n_CodeLlama-34b-Instruct-hf_lit-lightbulb_generation_v0.py │ │ └── 20231010_object_test_9_p_CodeLlama-34b-Instruct-hf_volume_generation_v0.py └── GPT-4-32k │ ├── compliance_evaluation_action.csv │ ├── compliance_evaluation_distractor.csv │ ├── compliance_evaluation_object.csv │ ├── final_games │ ├── 0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0_final.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3_final.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3_final.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3_final.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1_final.py │ ├── 0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0_final.py │ ├── 0512_action_test_13_p_gpt-4-32k_cooking_generation_v1_final.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3_final.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3_final.py │ ├── 0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1_final.py │ ├── 0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1_final.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3_final.py │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2_final.py │ ├── 0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0_final.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3_final.py │ ├── 0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0_final.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation_v3_final.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3_final.py │ ├── 0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation_v0_final.py │ ├── 0512_action_test_4_p_gpt-4-32k_cooking_generation_v0_final.py │ ├── 0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0_final.py │ ├── 0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1_final.py │ ├── 0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0_final.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3_final.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3_final.py │ ├── 0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1_final.py │ ├── 0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0_final.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3_final.py │ ├── 0512_action_test_9_p_gpt-4-32k_volume_generation_v1_final.py │ ├── 0512_distractor_test_10_n_gpt-4-32k_balance-scale-heaviest_generation_v1_final.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3_final.py │ ├── 0512_distractor_test_11_n_gpt-4-32k_bath-tub-water-temperature_generation_v0_final.py │ ├── 0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0_final.py │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2_final.py │ ├── 0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0_final.py │ ├── 0512_distractor_test_13_n_gpt-4-32k_bath-tub-water-temperature_generation_v0_final.py │ ├── 0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1_final.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3_final.py │ ├── 0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation_v1_final.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3_final.py │ ├── 0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1_final.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3_final.py │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2_final.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3_final.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3_final.py │ ├── 0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation_v3_final.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation_v3_final.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py │ ├── 0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2_final.py │ ├── 0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0_final.py │ ├── 0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0_final.py │ ├── 0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1_final.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3_final.py │ ├── 0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0_final.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3_final.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3_final.py │ ├── 0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1_final.py │ ├── 0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0_final.py │ ├── 0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1_final.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3_final.py │ ├── 0512_object_test_11_p_gpt-4-32k_bath-tub-water-temperature_generation_v0_final.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2_final.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3_final.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v3_final.py │ ├── 0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0_final.py │ ├── 0512_object_test_15_n_gpt-4-32k_volume_generation_v0_final.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3_final.py │ ├── 0512_object_test_16_n_gpt-4-32k_bath-tub-water-temperature_generation_v1_final.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v3_final.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3_final.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3_final.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3_final.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3_final.py │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2_final.py │ ├── 0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0_final.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3_final.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3_final.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation_v3_final.py │ ├── 0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0_final.py │ ├── 0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0_final.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3_final.py │ ├── 0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0_final.py │ ├── 0512_object_test_8_n_gpt-4-32k_volume_generation_v0_final.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py │ ├── 0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py │ └── 0512_object_test_9_p_gpt-4-32k_volume_generation_v0_final.py │ ├── generated_games │ ├── 0512_action_test_10_n_gpt-4-32k_blood-type_generation.py │ ├── 0512_action_test_10_n_gpt-4-32k_blood-type_prompt_out.txt │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_prompt_out.txt │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_prompt_out.txt │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_prompt_out.txt │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_action_test_12_p_gpt-4-32k_boil-water_generation.py │ ├── 0512_action_test_12_p_gpt-4-32k_boil-water_prompt_out.txt │ ├── 0512_action_test_13_n_gpt-4-32k_scale-weigh_generation.py │ ├── 0512_action_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt │ ├── 0512_action_test_13_p_gpt-4-32k_cooking_generation.py │ ├── 0512_action_test_13_p_gpt-4-32k_cooking_prompt_out.txt │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_prompt_out.txt │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_prompt_out.txt │ ├── 0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation.py │ ├── 0512_action_test_15_n_gpt-4-32k_refrigerate-food_prompt_out.txt │ ├── 0512_action_test_15_p_gpt-4-32k_space-walk_generation.py │ ├── 0512_action_test_15_p_gpt-4-32k_space-walk_prompt_out.txt │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_prompt_out.txt │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_generation.py │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_prompt_out.txt │ ├── 0512_action_test_1_n_gpt-4-32k_multimeter_generation.py │ ├── 0512_action_test_1_n_gpt-4-32k_multimeter_prompt_out.txt │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_prompt_out.txt │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_prompt_out.txt │ ├── 0512_action_test_2_p_gpt-4-32k_forge-key_generation.py │ ├── 0512_action_test_2_p_gpt-4-32k_forge-key_prompt_out.txt │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_prompt_out.txt │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_prompt_out.txt │ ├── 0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation.py │ ├── 0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_prompt_out.txt │ ├── 0512_action_test_4_p_gpt-4-32k_cooking_generation.py │ ├── 0512_action_test_4_p_gpt-4-32k_cooking_prompt_out.txt │ ├── 0512_action_test_5_n_gpt-4-32k_sweep-floor_generation.py │ ├── 0512_action_test_5_n_gpt-4-32k_sweep-floor_prompt_out.txt │ ├── 0512_action_test_5_p_gpt-4-32k_dishwasher_generation.py │ ├── 0512_action_test_5_p_gpt-4-32k_dishwasher_prompt_out.txt │ ├── 0512_action_test_6_n_gpt-4-32k_wash-clothes_generation.py │ ├── 0512_action_test_6_n_gpt-4-32k_wash-clothes_prompt_out.txt │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_prompt_out.txt │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_prompt_out.txt │ ├── 0512_action_test_7_p_gpt-4-32k_dishwasher_generation.py │ ├── 0512_action_test_7_p_gpt-4-32k_dishwasher_prompt_out.txt │ ├── 0512_action_test_8_n_gpt-4-32k_plant-tree_generation.py │ ├── 0512_action_test_8_n_gpt-4-32k_plant-tree_prompt_out.txt │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_prompt_out.txt │ ├── 0512_action_test_9_p_gpt-4-32k_volume_generation.py │ ├── 0512_action_test_9_p_gpt-4-32k_volume_prompt_out.txt │ ├── 0512_distractor_test_10_n_gpt-4-32k_balance-scale-heaviest_generation.py │ ├── 0512_distractor_test_10_n_gpt-4-32k_balance-scale-heaviest_prompt_out.txt │ ├── 0512_distractor_test_10_n_gpt-4-32k_use-bandage_prompt_out.txt │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_prompt_out.txt │ ├── 0512_distractor_test_11_n_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_distractor_test_11_n_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation.py │ ├── 0512_distractor_test_11_p_gpt-4-32k_sweep-floor_prompt_out.txt │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_generation.py │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_prompt_out.txt │ ├── 0512_distractor_test_12_p_gpt-4-32k_volume_generation.py │ ├── 0512_distractor_test_12_p_gpt-4-32k_volume_prompt_out.txt │ ├── 0512_distractor_test_13_n_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_distractor_test_13_n_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_distractor_test_13_p_gpt-4-32k_multimeter_generation.py │ ├── 0512_distractor_test_13_p_gpt-4-32k_multimeter_prompt_out.txt │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_prompt_out.txt │ ├── 0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation.py │ ├── 0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_prompt_out.txt │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_prompt_out.txt │ ├── 0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation.py │ ├── 0512_distractor_test_15_p_gpt-4-32k_dishwasher_prompt_out.txt │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_prompt_out.txt │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation.py │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_prompt_out.txt │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_prompt_out.txt │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_prompt_out.txt │ ├── 0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation.py │ ├── 0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_prompt_out.txt │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_prompt_out.txt │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt │ ├── 0512_distractor_test_4_p_gpt-4-32k_use-bandage_prompt_out.txt │ ├── 0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation.py │ ├── 0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_prompt_out.txt │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation.py │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_prompt_out.txt │ ├── 0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation.py │ ├── 0512_distractor_test_6_n_gpt-4-32k_clean-energy_prompt_out.txt │ ├── 0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation.py │ ├── 0512_distractor_test_6_p_gpt-4-32k_scale-weigh_prompt_out.txt │ ├── 0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation.py │ ├── 0512_distractor_test_7_n_gpt-4-32k_clean-energy_prompt_out.txt │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_prompt_out.txt │ ├── 0512_distractor_test_8_n_gpt-4-32k_conductivity_generation.py │ ├── 0512_distractor_test_8_n_gpt-4-32k_conductivity_prompt_out.txt │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_prompt_out.txt │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_prompt_out.txt │ ├── 0512_distractor_test_9_p_gpt-4-32k_cooking_generation.py │ ├── 0512_distractor_test_9_p_gpt-4-32k_cooking_prompt_out.txt │ ├── 0512_object_test_10_n_gpt-4-32k_metal-detector_generation.py │ ├── 0512_object_test_10_n_gpt-4-32k_metal-detector_prompt_out.txt │ ├── 0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation.py │ ├── 0512_object_test_10_p_gpt-4-32k_make-ice-cubes_prompt_out.txt │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_prompt_out.txt │ ├── 0512_object_test_11_p_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_object_test_11_p_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_generation.py │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_prompt_out.txt │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt │ ├── 0512_object_test_14_n_gpt-4-32k_use-bandage_prompt_out.txt │ ├── 0512_object_test_14_p_gpt-4-32k_sweep-floor_generation.py │ ├── 0512_object_test_14_p_gpt-4-32k_sweep-floor_prompt_out.txt │ ├── 0512_object_test_15_n_gpt-4-32k_volume_generation.py │ ├── 0512_object_test_15_n_gpt-4-32k_volume_prompt_out.txt │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_prompt_out.txt │ ├── 0512_object_test_16_n_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_object_test_16_n_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_prompt_out.txt │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_prompt_out.txt │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_prompt_out.txt │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_prompt_out.txt │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_prompt_out.txt │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation.py │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt │ ├── 0512_object_test_3_p_gpt-4-32k_wash-clothes_generation.py │ ├── 0512_object_test_3_p_gpt-4-32k_wash-clothes_prompt_out.txt │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_prompt_out.txt │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_prompt_out.txt │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_prompt_out.txt │ ├── 0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation.py │ ├── 0512_object_test_6_n_gpt-4-32k_bird-life-cycle_prompt_out.txt │ ├── 0512_object_test_6_p_gpt-4-32k_conductivity_generation.py │ ├── 0512_object_test_6_p_gpt-4-32k_conductivity_prompt_out.txt │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_prompt_out.txt │ ├── 0512_object_test_7_p_gpt-4-32k_boil-water_generation.py │ ├── 0512_object_test_7_p_gpt-4-32k_boil-water_prompt_out.txt │ ├── 0512_object_test_8_n_gpt-4-32k_volume_generation.py │ ├── 0512_object_test_8_n_gpt-4-32k_volume_prompt_out.txt │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_prompt_out.txt │ ├── 0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation.py │ ├── 0512_object_test_9_n_gpt-4-32k_lit-lightbulb_prompt_out.txt │ ├── 0512_object_test_9_p_gpt-4-32k_volume_generation.py │ └── 0512_object_test_9_p_gpt-4-32k_volume_prompt_out.txt │ ├── pathcrawl_outputs_original_and_reflected.zip │ ├── results.json │ └── revised_games │ ├── 0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation_v0.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation_v1.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation_v2.py │ ├── 0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation_v0.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation_v1.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation_v2.py │ ├── 0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v0.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v1.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v2.py │ ├── 0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_action_test_12_p_gpt-4-32k_boil-water_generation_v0.py │ ├── 0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1.py │ ├── 0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py │ ├── 0512_action_test_13_p_gpt-4-32k_cooking_generation_v0.py │ ├── 0512_action_test_13_p_gpt-4-32k_cooking_generation_v1.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation_v0.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation_v1.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation_v2.py │ ├── 0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v0.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v1.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v2.py │ ├── 0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3.py │ ├── 0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v0.py │ ├── 0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1.py │ ├── 0512_action_test_15_p_gpt-4-32k_space-walk_generation_v0.py │ ├── 0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation_v0.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation_v1.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation_v2.py │ ├── 0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3.py │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v0.py │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v1.py │ ├── 0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2.py │ ├── 0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v0.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v1.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v2.py │ ├── 0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation_v0.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation_v1.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation_v2.py │ ├── 0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3.py │ ├── 0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation_v0.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation_v1.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation_v2.py │ ├── 0512_action_test_3_n_gpt-4-32k_volume_generation_v3.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation_v0.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation_v1.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation_v2.py │ ├── 0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3.py │ ├── 0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation_v0.py │ ├── 0512_action_test_4_p_gpt-4-32k_cooking_generation_v0.py │ ├── 0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0.py │ ├── 0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v0.py │ ├── 0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1.py │ ├── 0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation_v0.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation_v1.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation_v2.py │ ├── 0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation_v0.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation_v1.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation_v2.py │ ├── 0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3.py │ ├── 0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v0.py │ ├── 0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1.py │ ├── 0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v0.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v1.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v2.py │ ├── 0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3.py │ ├── 0512_action_test_9_p_gpt-4-32k_volume_generation_v0.py │ ├── 0512_action_test_9_p_gpt-4-32k_volume_generation_v1.py │ ├── 0512_distractor_test_10_n_gpt-4-32k_balance-scale-heaviest_generation_v0.py │ ├── 0512_distractor_test_10_n_gpt-4-32k_balance-scale-heaviest_generation_v1.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v0.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v1.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v2.py │ ├── 0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3.py │ ├── 0512_distractor_test_11_n_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0.py │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v0.py │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v1.py │ ├── 0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2.py │ ├── 0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0.py │ ├── 0512_distractor_test_13_n_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v0.py │ ├── 0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v0.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v1.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v2.py │ ├── 0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3.py │ ├── 0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation_v0.py │ ├── 0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation_v1.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v0.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v1.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v2.py │ ├── 0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3.py │ ├── 0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v0.py │ ├── 0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v0.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v1.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v2.py │ ├── 0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3.py │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v0.py │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v1.py │ ├── 0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v0.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v1.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v2.py │ ├── 0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v0.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v1.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v2.py │ ├── 0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3.py │ ├── 0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v0.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v1.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v2.py │ ├── 0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation_v1.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation_v2.py │ ├── 0512_distractor_test_3_n_gpt-4-32k_bath-tub-water-temperature_generation_v3.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation_v1.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation_v2.py │ ├── 0512_distractor_test_4_n_gpt-4-32k_bath-tub-water-temperature_generation_v3.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v0.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v1.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v2.py │ ├── 0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3.py │ ├── 0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0.py │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v0.py │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v1.py │ ├── 0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2.py │ ├── 0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0.py │ ├── 0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0.py │ ├── 0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v0.py │ ├── 0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v0.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v1.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v2.py │ ├── 0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3.py │ ├── 0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v0.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v1.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v2.py │ ├── 0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v0.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v1.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v2.py │ ├── 0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3.py │ ├── 0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v0.py │ ├── 0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1.py │ ├── 0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0.py │ ├── 0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v0.py │ ├── 0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v0.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v1.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v2.py │ ├── 0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3.py │ ├── 0512_object_test_11_p_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v0.py │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v1.py │ ├── 0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v1.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v2.py │ ├── 0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v0.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v1.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v2.py │ ├── 0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v3.py │ ├── 0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0.py │ ├── 0512_object_test_15_n_gpt-4-32k_volume_generation_v0.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation_v0.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation_v1.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation_v2.py │ ├── 0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3.py │ ├── 0512_object_test_16_n_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_object_test_16_n_gpt-4-32k_bath-tub-water-temperature_generation_v1.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v0.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v1.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v2.py │ ├── 0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v3.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v0.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v1.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v2.py │ ├── 0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v0.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v1.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v2.py │ ├── 0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation_v0.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation_v1.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation_v2.py │ ├── 0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v0.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v1.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v2.py │ ├── 0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3.py │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v0.py │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v1.py │ ├── 0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2.py │ ├── 0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v0.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v1.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v2.py │ ├── 0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v0.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v1.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v2.py │ ├── 0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v0.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v1.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v2.py │ ├── 0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation_v0.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation_v1.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation_v2.py │ ├── 0512_object_test_5_p_gpt-4-32k_bath-tub-water-temperature_generation_v3.py │ ├── 0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0.py │ ├── 0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v0.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v1.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v2.py │ ├── 0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3.py │ ├── 0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0.py │ ├── 0512_object_test_8_n_gpt-4-32k_volume_generation_v0.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation_v0.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation_v1.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation_v2.py │ ├── 0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3.py │ ├── 0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0.py │ └── 0512_object_test_9_p_gpt-4-32k_volume_generation_v0.py ├── scripts ├── generate_experiment_file.py ├── make_figure4.py ├── make_table2.py ├── make_table3.py ├── run_code_evaluation.py ├── run_code_generation.py └── run_code_reflection.py └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/LICENSE -------------------------------------------------------------------------------- /MANIFEST.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/MANIFEST.in -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/README.md -------------------------------------------------------------------------------- /bytes32/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/__init__.py -------------------------------------------------------------------------------- /bytes32/alignment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/alignment.py -------------------------------------------------------------------------------- /bytes32/compliance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/compliance.py -------------------------------------------------------------------------------- /bytes32/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/utils.py -------------------------------------------------------------------------------- /bytes32/validity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/validity.py -------------------------------------------------------------------------------- /bytes32/version.py: -------------------------------------------------------------------------------- 1 | __version__ = '1.1.1' 2 | -------------------------------------------------------------------------------- /bytes32/winnability/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /bytes32/winnability/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/winnability/example.txt -------------------------------------------------------------------------------- /bytes32/winnability/language_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/bytes32/winnability/language_agent.py -------------------------------------------------------------------------------- /data/action_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/action_test.csv -------------------------------------------------------------------------------- /data/action_train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/action_train.csv -------------------------------------------------------------------------------- /data/distractor_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/distractor_test.csv -------------------------------------------------------------------------------- /data/distractor_train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/distractor_train.csv -------------------------------------------------------------------------------- /data/experiment_action.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/experiment_action.csv -------------------------------------------------------------------------------- /data/experiment_distractor.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/experiment_distractor.csv -------------------------------------------------------------------------------- /data/experiment_object.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/experiment_object.csv -------------------------------------------------------------------------------- /data/object_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/object_test.csv -------------------------------------------------------------------------------- /data/object_train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/object_train.csv -------------------------------------------------------------------------------- /data/playthroughs/balance-scale-heaviest-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/balance-scale-heaviest-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/balance-scale-weigh-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/balance-scale-weigh-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/bath-tub-water-temperature-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/bath-tub-water-temperature-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/bird-life-cycle-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/bird-life-cycle-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/blood-type-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/blood-type-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/boil-water-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/boil-water-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/clean-energy-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/clean-energy-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/conductivity-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/conductivity-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/cooking-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/cooking-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/dishwasher-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/dishwasher-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/forge-key-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/forge-key-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/hang-painting-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/hang-painting-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/inclined-plane-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/inclined-plane-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/lit-light-bulb-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/lit-light-bulb-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/make-campfire-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/make-campfire-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/make-ice-cubes-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/make-ice-cubes-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/metal-detector-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/metal-detector-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/mix-paint-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/mix-paint-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/multimeter-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/multimeter-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/plant-tree-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/plant-tree-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/refrigerate-food-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/refrigerate-food-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/scale-weigh-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/scale-weigh-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/space-walk-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/space-walk-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/sunburn-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/sunburn-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/sweep-floor-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/sweep-floor-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/take-photo-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/take-photo-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/thermometer-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/thermometer-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/use-bandage-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/use-bandage-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/volume-container-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/volume-container-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/volume-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/volume-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/volume-stone-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/volume-stone-playthrough.txt -------------------------------------------------------------------------------- /data/playthroughs/wash-clothes-playthrough.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/playthroughs/wash-clothes-playthrough.txt -------------------------------------------------------------------------------- /data/programs/balance-scale-heaviest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/balance-scale-heaviest.py -------------------------------------------------------------------------------- /data/programs/balance-scale-weigh.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/balance-scale-weigh.py -------------------------------------------------------------------------------- /data/programs/bath-tub-water-temperature.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/bath-tub-water-temperature.py -------------------------------------------------------------------------------- /data/programs/bird-life-cycle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/bird-life-cycle.py -------------------------------------------------------------------------------- /data/programs/blood-type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/blood-type.py -------------------------------------------------------------------------------- /data/programs/boil-water.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/boil-water.py -------------------------------------------------------------------------------- /data/programs/clean-energy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/clean-energy.py -------------------------------------------------------------------------------- /data/programs/conductivity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/conductivity.py -------------------------------------------------------------------------------- /data/programs/cooking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/cooking.py -------------------------------------------------------------------------------- /data/programs/dishwasher-reductionattempt1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/dishwasher-reductionattempt1.py -------------------------------------------------------------------------------- /data/programs/dishwasher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/dishwasher.py -------------------------------------------------------------------------------- /data/programs/forge-key.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/forge-key.py -------------------------------------------------------------------------------- /data/programs/hang-painting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/hang-painting.py -------------------------------------------------------------------------------- /data/programs/inclined-plane.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/inclined-plane.py -------------------------------------------------------------------------------- /data/programs/lit-lightbulb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/lit-lightbulb.py -------------------------------------------------------------------------------- /data/programs/make-campfire.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/make-campfire.py -------------------------------------------------------------------------------- /data/programs/make-ice-cubes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/make-ice-cubes.py -------------------------------------------------------------------------------- /data/programs/metal-detector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/metal-detector.py -------------------------------------------------------------------------------- /data/programs/mix-paint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/mix-paint.py -------------------------------------------------------------------------------- /data/programs/multimeter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/multimeter.py -------------------------------------------------------------------------------- /data/programs/plant-tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/plant-tree.py -------------------------------------------------------------------------------- /data/programs/refrigerate-food.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/refrigerate-food.py -------------------------------------------------------------------------------- /data/programs/scale-weigh.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/scale-weigh.py -------------------------------------------------------------------------------- /data/programs/space-walk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/space-walk.py -------------------------------------------------------------------------------- /data/programs/sunburn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/sunburn.py -------------------------------------------------------------------------------- /data/programs/sweep-floor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/sweep-floor.py -------------------------------------------------------------------------------- /data/programs/take-photo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/take-photo.py -------------------------------------------------------------------------------- /data/programs/thermometer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/thermometer.py -------------------------------------------------------------------------------- /data/programs/use-bandage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/use-bandage.py -------------------------------------------------------------------------------- /data/programs/volume-container.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/volume-container.py -------------------------------------------------------------------------------- /data/programs/volume-stone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/volume-stone.py -------------------------------------------------------------------------------- /data/programs/volume.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/volume.py -------------------------------------------------------------------------------- /data/programs/wash-clothes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/programs/wash-clothes.py -------------------------------------------------------------------------------- /data/test_eval.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_eval.csv -------------------------------------------------------------------------------- /data/test_prompts/test_1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_1.py -------------------------------------------------------------------------------- /data/test_prompts/test_10.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_10.py -------------------------------------------------------------------------------- /data/test_prompts/test_11.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_11.py -------------------------------------------------------------------------------- /data/test_prompts/test_12.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_12.py -------------------------------------------------------------------------------- /data/test_prompts/test_13.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_13.py -------------------------------------------------------------------------------- /data/test_prompts/test_14.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_14.py -------------------------------------------------------------------------------- /data/test_prompts/test_15.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_15.py -------------------------------------------------------------------------------- /data/test_prompts/test_16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_16.py -------------------------------------------------------------------------------- /data/test_prompts/test_2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_2.py -------------------------------------------------------------------------------- /data/test_prompts/test_3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_3.py -------------------------------------------------------------------------------- /data/test_prompts/test_4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_4.py -------------------------------------------------------------------------------- /data/test_prompts/test_5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_5.py -------------------------------------------------------------------------------- /data/test_prompts/test_6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_6.py -------------------------------------------------------------------------------- /data/test_prompts/test_7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_7.py -------------------------------------------------------------------------------- /data/test_prompts/test_8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_8.py -------------------------------------------------------------------------------- /data/test_prompts/test_9.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/data/test_prompts/test_9.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | openai>=1.0.0 2 | tiktoken 3 | pandas 4 | tqdm 5 | plotly 6 | tenacity -------------------------------------------------------------------------------- /results/2023-10-20/generated_games/output_CodeLlama-34b-Instruct-meta/_distractor_test_16_n_CodeLlama-34b-Instruct_lit-lightbulb_generation.py: -------------------------------------------------------------------------------- 1 | Here is a possible implementation of the task in Python: -------------------------------------------------------------------------------- /results/2023-10-20/generated_games/output_CodeLlama-34b-Instruct-meta/_object_test_16_n_CodeLlama-34b-Instruct_bath-tub-water-temperature_generation.py: -------------------------------------------------------------------------------- 1 | Here is a possible implementation of the task in Python: -------------------------------------------------------------------------------- /results/CodeLlama-34b-Instruct/results.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/CodeLlama-34b-Instruct/results.json -------------------------------------------------------------------------------- /results/CodeLlama-34b-Instruct/results_with_revisions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/CodeLlama-34b-Instruct/results_with_revisions.json -------------------------------------------------------------------------------- /results/CodeLlama-34b-Instruct/revised_games/20231010_action_test_5_n_CodeLlama-34b-Instruct-hf_sweep-floor_generation_v1.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /results/CodeLlama-34b-Instruct/revised_games/20231010_object_test_3_p_CodeLlama-34b-Instruct-hf_wash-clothes_generation_v1.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /results/GPT-4-32k/compliance_evaluation_action.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/compliance_evaluation_action.csv -------------------------------------------------------------------------------- /results/GPT-4-32k/compliance_evaluation_distractor.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/compliance_evaluation_distractor.csv -------------------------------------------------------------------------------- /results/GPT-4-32k/compliance_evaluation_object.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/compliance_evaluation_object.csv -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_4_p_gpt-4-32k_cooking_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_4_p_gpt-4-32k_cooking_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_15_n_gpt-4-32k_volume_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_15_n_gpt-4-32k_volume_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_8_n_gpt-4-32k_volume_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_8_n_gpt-4-32k_volume_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/final_games/0512_object_test_9_p_gpt-4-32k_volume_generation_v0_final.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/final_games/0512_object_test_9_p_gpt-4-32k_volume_generation_v0_final.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_10_n_gpt-4-32k_blood-type_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_10_n_gpt-4-32k_blood-type_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_10_p_gpt-4-32k_thermometer_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_10_p_gpt-4-32k_thermometer_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_11_n_gpt-4-32k_multimeter_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_11_n_gpt-4-32k_multimeter_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_11_p_gpt-4-32k_mix-paint_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_11_p_gpt-4-32k_mix-paint_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_12_n_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_12_n_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_12_p_gpt-4-32k_boil-water_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_12_p_gpt-4-32k_boil-water_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_13_p_gpt-4-32k_cooking_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_13_p_gpt-4-32k_cooking_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_13_p_gpt-4-32k_cooking_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_13_p_gpt-4-32k_cooking_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_14_n_gpt-4-32k_multimeter_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_14_n_gpt-4-32k_multimeter_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_14_p_gpt-4-32k_metal-detector_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_14_p_gpt-4-32k_metal-detector_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_15_p_gpt-4-32k_space-walk_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_15_p_gpt-4-32k_space-walk_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_16_n_gpt-4-32k_space-walk_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_16_n_gpt-4-32k_space-walk_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_1_n_gpt-4-32k_multimeter_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_1_n_gpt-4-32k_multimeter_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_2_n_gpt-4-32k_multimeter_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_2_n_gpt-4-32k_multimeter_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_2_p_gpt-4-32k_forge-key_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_2_p_gpt-4-32k_forge-key_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_3_n_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_3_n_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_3_n_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_3_n_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_3_p_gpt-4-32k_take-photo_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_3_p_gpt-4-32k_take-photo_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_4_p_gpt-4-32k_cooking_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_4_p_gpt-4-32k_cooking_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_4_p_gpt-4-32k_cooking_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_4_p_gpt-4-32k_cooking_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_5_p_gpt-4-32k_dishwasher_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_5_p_gpt-4-32k_dishwasher_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_6_p_gpt-4-32k_conductivity_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_6_p_gpt-4-32k_conductivity_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_7_n_gpt-4-32k_volume-container_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_7_n_gpt-4-32k_volume-container_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_7_p_gpt-4-32k_dishwasher_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_7_p_gpt-4-32k_dishwasher_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_8_n_gpt-4-32k_plant-tree_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_8_n_gpt-4-32k_plant-tree_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_8_p_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_8_p_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_9_p_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_9_p_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_action_test_9_p_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_action_test_9_p_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_10_n_gpt-4-32k_use-bandage_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_10_n_gpt-4-32k_use-bandage_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_12_p_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_12_p_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_14_p_gpt-4-32k_balance-scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_use-bandage_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_4_p_gpt-4-32k_use-bandage_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_distractor_test_9_p_gpt-4-32k_cooking_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_distractor_test_9_p_gpt-4-32k_cooking_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_10_n_gpt-4-32k_metal-detector_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_10_n_gpt-4-32k_metal-detector_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_12_n_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_12_n_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_12_p_gpt-4-32k_dishwasher_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_12_p_gpt-4-32k_dishwasher_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_13_p_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_13_p_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_use-bandage_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_14_n_gpt-4-32k_use-bandage_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_15_n_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_15_n_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_15_n_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_15_n_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_15_p_gpt-4-32k_space-walk_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_15_p_gpt-4-32k_space-walk_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_1_n_gpt-4-32k_plant-tree_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_1_n_gpt-4-32k_plant-tree_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_2_n_gpt-4-32k_take-photo_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_2_n_gpt-4-32k_take-photo_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_2_p_gpt-4-32k_volume-stone_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_2_p_gpt-4-32k_volume-stone_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_4_n_gpt-4-32k_make-campfire_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_4_n_gpt-4-32k_make-campfire_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_4_p_gpt-4-32k_metal-detector_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_5_n_gpt-4-32k_clean-energy_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_5_n_gpt-4-32k_clean-energy_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_6_p_gpt-4-32k_conductivity_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_6_p_gpt-4-32k_conductivity_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_7_n_gpt-4-32k_hang-painting_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_7_n_gpt-4-32k_hang-painting_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_7_p_gpt-4-32k_boil-water_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_7_p_gpt-4-32k_boil-water_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_8_n_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_8_n_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_8_n_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_8_n_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_8_p_gpt-4-32k_sunburn_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_8_p_gpt-4-32k_sunburn_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_9_p_gpt-4-32k_volume_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_9_p_gpt-4-32k_volume_generation.py -------------------------------------------------------------------------------- /results/GPT-4-32k/generated_games/0512_object_test_9_p_gpt-4-32k_volume_prompt_out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/generated_games/0512_object_test_9_p_gpt-4-32k_volume_prompt_out.txt -------------------------------------------------------------------------------- /results/GPT-4-32k/pathcrawl_outputs_original_and_reflected.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/pathcrawl_outputs_original_and_reflected.zip -------------------------------------------------------------------------------- /results/GPT-4-32k/results.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/results.json -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_10_n_gpt-4-32k_blood-type_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_10_p_gpt-4-32k_thermometer_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_n_gpt-4-32k_multimeter_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_11_p_gpt-4-32k_mix-paint_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_n_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_12_p_gpt-4-32k_boil-water_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_13_p_gpt-4-32k_cooking_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_n_gpt-4-32k_multimeter_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_14_p_gpt-4-32k_metal-detector_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_15_n_gpt-4-32k_refrigerate-food_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_15_p_gpt-4-32k_space-walk_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_n_gpt-4-32k_space-walk_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_16_p_gpt-4-32k_scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_1_n_gpt-4-32k_multimeter_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_1_p_gpt-4-32k_make-ice-cubes_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_2_n_gpt-4-32k_multimeter_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_2_p_gpt-4-32k_forge-key_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_n_gpt-4-32k_volume_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_3_p_gpt-4-32k_take-photo_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_4_n_gpt-4-32k_balance-scale-heaviest_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_4_p_gpt-4-32k_cooking_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_4_p_gpt-4-32k_cooking_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_5_n_gpt-4-32k_sweep-floor_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_5_p_gpt-4-32k_dishwasher_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_6_n_gpt-4-32k_wash-clothes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_6_p_gpt-4-32k_conductivity_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_n_gpt-4-32k_volume-container_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_7_p_gpt-4-32k_dishwasher_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_8_n_gpt-4-32k_plant-tree_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_8_p_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_n_gpt-4-32k_scale-weigh_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_action_test_9_p_gpt-4-32k_volume_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_10_p_gpt-4-32k_make-campfire_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_11_p_gpt-4-32k_sweep-floor_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_12_n_gpt-4-32k_space-walk_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_12_p_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_13_p_gpt-4-32k_multimeter_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_14_n_gpt-4-32k_volume-stone_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_n_gpt-4-32k_space-walk_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_15_p_gpt-4-32k_dishwasher_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_n_gpt-4-32k_lit-lightbulb_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_16_p_gpt-4-32k_plant-tree_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_n_gpt-4-32k_use-bandage_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_1_p_gpt-4-32k_bird-life-cycle_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_2_n_gpt-4-32k_lit-lightbulb_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_2_p_gpt-4-32k_make-ice-cubes_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_3_p_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_4_p_gpt-4-32k_metal-detector_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_5_n_gpt-4-32k_lit-lightbulb_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_5_p_gpt-4-32k_make-ice-cubes_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_6_n_gpt-4-32k_clean-energy_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_6_p_gpt-4-32k_scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_n_gpt-4-32k_clean-energy_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_7_p_gpt-4-32k_refrigerate-food_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_8_n_gpt-4-32k_conductivity_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_8_p_gpt-4-32k_dishwasher_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_n_gpt-4-32k_volume-stone_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_distractor_test_9_p_gpt-4-32k_cooking_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_10_n_gpt-4-32k_metal-detector_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_10_p_gpt-4-32k_make-ice-cubes_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_11_n_gpt-4-32k_inclined-plane_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_n_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_12_p_gpt-4-32k_dishwasher_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_n_gpt-4-32k_scale-weigh_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_13_p_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_14_n_gpt-4-32k_balance-scale-weigh_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_14_p_gpt-4-32k_sweep-floor_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_15_n_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_15_n_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_15_p_gpt-4-32k_space-walk_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_16_p_gpt-4-32k_balance-scale-weigh_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_n_gpt-4-32k_plant-tree_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_1_p_gpt-4-32k_refrigerate-food_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_n_gpt-4-32k_take-photo_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_2_p_gpt-4-32k_volume-stone_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_3_n_gpt-4-32k_balance-scale-weigh_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_3_p_gpt-4-32k_wash-clothes_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_n_gpt-4-32k_make-campfire_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_4_p_gpt-4-32k_metal-detector_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_5_n_gpt-4-32k_clean-energy_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_6_n_gpt-4-32k_bird-life-cycle_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_6_p_gpt-4-32k_conductivity_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_7_n_gpt-4-32k_hang-painting_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_7_p_gpt-4-32k_boil-water_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_8_n_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_8_n_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v1.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v2.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_8_p_gpt-4-32k_sunburn_generation_v3.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_9_n_gpt-4-32k_lit-lightbulb_generation_v0.py -------------------------------------------------------------------------------- /results/GPT-4-32k/revised_games/0512_object_test_9_p_gpt-4-32k_volume_generation_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/results/GPT-4-32k/revised_games/0512_object_test_9_p_gpt-4-32k_volume_generation_v0.py -------------------------------------------------------------------------------- /scripts/generate_experiment_file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/generate_experiment_file.py -------------------------------------------------------------------------------- /scripts/make_figure4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/make_figure4.py -------------------------------------------------------------------------------- /scripts/make_table2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/make_table2.py -------------------------------------------------------------------------------- /scripts/make_table3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/make_table3.py -------------------------------------------------------------------------------- /scripts/run_code_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/run_code_evaluation.py -------------------------------------------------------------------------------- /scripts/run_code_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/run_code_generation.py -------------------------------------------------------------------------------- /scripts/run_code_reflection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/scripts/run_code_reflection.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cognitiveailab/BYTESIZED32/HEAD/setup.py --------------------------------------------------------------------------------