diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements.dfy b/benches/HumanEval/000_has_close_elements/has_close_elements.dfy similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements.dfy rename to benches/HumanEval/000_has_close_elements/has_close_elements.dfy diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements.nagini b/benches/HumanEval/000_has_close_elements/has_close_elements.nagini similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements.nagini rename to benches/HumanEval/000_has_close_elements/has_close_elements.nagini diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements.prompt b/benches/HumanEval/000_has_close_elements/has_close_elements.prompt similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements.prompt rename to benches/HumanEval/000_has_close_elements/has_close_elements.prompt diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements.py b/benches/HumanEval/000_has_close_elements/has_close_elements.py similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements.py rename to benches/HumanEval/000_has_close_elements/has_close_elements.py diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements.vpr b/benches/HumanEval/000_has_close_elements/has_close_elements.vpr similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements.vpr rename to benches/HumanEval/000_has_close_elements/has_close_elements.vpr diff --git a/benches/HumanEval/0_has_close_elements/has_close_elements_wo.dfy b/benches/HumanEval/000_has_close_elements/has_close_elements_wo.dfy similarity index 100% rename from benches/HumanEval/0_has_close_elements/has_close_elements_wo.dfy rename to benches/HumanEval/000_has_close_elements/has_close_elements_wo.dfy diff --git a/benches/HumanEval/1_separate_paren_groups/separate_paren_groups.dfy b/benches/HumanEval/001_separate_paren_groups/separate_paren_groups.dfy similarity index 100% rename from benches/HumanEval/1_separate_paren_groups/separate_paren_groups.dfy rename to benches/HumanEval/001_separate_paren_groups/separate_paren_groups.dfy diff --git a/benches/HumanEval/1_separate_paren_groups/separate_paren_groups.prompt b/benches/HumanEval/001_separate_paren_groups/separate_paren_groups.prompt similarity index 100% rename from benches/HumanEval/1_separate_paren_groups/separate_paren_groups.prompt rename to benches/HumanEval/001_separate_paren_groups/separate_paren_groups.prompt diff --git a/benches/HumanEval/1_separate_paren_groups/separate_paren_groups.py b/benches/HumanEval/001_separate_paren_groups/separate_paren_groups.py similarity index 100% rename from benches/HumanEval/1_separate_paren_groups/separate_paren_groups.py rename to benches/HumanEval/001_separate_paren_groups/separate_paren_groups.py diff --git a/benches/HumanEval/2_truncate/truncate.py b/benches/HumanEval/002_truncate/truncate.py similarity index 100% rename from benches/HumanEval/2_truncate/truncate.py rename to benches/HumanEval/002_truncate/truncate.py diff --git a/benches/HumanEval/3_below_zero/below_zero.prompt b/benches/HumanEval/003_below_zero/below_zero.prompt similarity index 100% rename from benches/HumanEval/3_below_zero/below_zero.prompt rename to benches/HumanEval/003_below_zero/below_zero.prompt diff --git a/benches/HumanEval/3_below_zero/below_zero.py b/benches/HumanEval/003_below_zero/below_zero.py similarity index 100% rename from benches/HumanEval/3_below_zero/below_zero.py rename to benches/HumanEval/003_below_zero/below_zero.py diff --git a/benches/HumanEval/4_mean_absolute_derivation/mean_absolute_derivation.prompt b/benches/HumanEval/004_mean_absolute_derivation/mean_absolute_derivation.prompt similarity index 100% rename from benches/HumanEval/4_mean_absolute_derivation/mean_absolute_derivation.prompt rename to benches/HumanEval/004_mean_absolute_derivation/mean_absolute_derivation.prompt diff --git a/benches/HumanEval/4_mean_absolute_derivation/mean_absolute_derivation.py b/benches/HumanEval/004_mean_absolute_derivation/mean_absolute_derivation.py similarity index 100% rename from benches/HumanEval/4_mean_absolute_derivation/mean_absolute_derivation.py rename to benches/HumanEval/004_mean_absolute_derivation/mean_absolute_derivation.py diff --git a/benches/HumanEval/5_intersperse/intersperse.dfy b/benches/HumanEval/005_intersperse/intersperse.dfy similarity index 100% rename from benches/HumanEval/5_intersperse/intersperse.dfy rename to benches/HumanEval/005_intersperse/intersperse.dfy diff --git a/benches/HumanEval/5_intersperse/intersperse.nagini b/benches/HumanEval/005_intersperse/intersperse.nagini similarity index 100% rename from benches/HumanEval/5_intersperse/intersperse.nagini rename to benches/HumanEval/005_intersperse/intersperse.nagini diff --git a/benches/HumanEval/5_intersperse/intersperse.prompt b/benches/HumanEval/005_intersperse/intersperse.prompt similarity index 100% rename from benches/HumanEval/5_intersperse/intersperse.prompt rename to benches/HumanEval/005_intersperse/intersperse.prompt diff --git a/benches/HumanEval/5_intersperse/intersperse.py b/benches/HumanEval/005_intersperse/intersperse.py similarity index 100% rename from benches/HumanEval/5_intersperse/intersperse.py rename to benches/HumanEval/005_intersperse/intersperse.py diff --git a/benches/HumanEval/5_intersperse/intersperse.vpr b/benches/HumanEval/005_intersperse/intersperse.vpr similarity index 100% rename from benches/HumanEval/5_intersperse/intersperse.vpr rename to benches/HumanEval/005_intersperse/intersperse.vpr diff --git a/benches/HumanEval/6_parse_nested_parens/parse_nested_parens.dfy b/benches/HumanEval/006_parse_nested_parens/parse_nested_parens.dfy similarity index 100% rename from benches/HumanEval/6_parse_nested_parens/parse_nested_parens.dfy rename to benches/HumanEval/006_parse_nested_parens/parse_nested_parens.dfy diff --git a/benches/HumanEval/6_parse_nested_parens/parse_nested_parens.prompt b/benches/HumanEval/006_parse_nested_parens/parse_nested_parens.prompt similarity index 100% rename from benches/HumanEval/6_parse_nested_parens/parse_nested_parens.prompt rename to benches/HumanEval/006_parse_nested_parens/parse_nested_parens.prompt diff --git a/benches/HumanEval/6_parse_nested_parens/parse_nested_parens.py b/benches/HumanEval/006_parse_nested_parens/parse_nested_parens.py similarity index 100% rename from benches/HumanEval/6_parse_nested_parens/parse_nested_parens.py rename to benches/HumanEval/006_parse_nested_parens/parse_nested_parens.py diff --git a/benches/HumanEval/7_filter_by_substring/filter_by_substring.dfy b/benches/HumanEval/007_filter_by_substring/filter_by_substring.dfy similarity index 100% rename from benches/HumanEval/7_filter_by_substring/filter_by_substring.dfy rename to benches/HumanEval/007_filter_by_substring/filter_by_substring.dfy diff --git a/benches/HumanEval/7_filter_by_substring/filter_by_substring.prompt b/benches/HumanEval/007_filter_by_substring/filter_by_substring.prompt similarity index 100% rename from benches/HumanEval/7_filter_by_substring/filter_by_substring.prompt rename to benches/HumanEval/007_filter_by_substring/filter_by_substring.prompt diff --git a/benches/HumanEval/7_filter_by_substring/filter_by_substring.py b/benches/HumanEval/007_filter_by_substring/filter_by_substring.py similarity index 100% rename from benches/HumanEval/7_filter_by_substring/filter_by_substring.py rename to benches/HumanEval/007_filter_by_substring/filter_by_substring.py diff --git a/benches/HumanEval/8_sum_product/sum_product.prompt b/benches/HumanEval/008_sum_product/sum_product.prompt similarity index 100% rename from benches/HumanEval/8_sum_product/sum_product.prompt rename to benches/HumanEval/008_sum_product/sum_product.prompt diff --git a/benches/HumanEval/8_sum_product/sum_product.py b/benches/HumanEval/008_sum_product/sum_product.py similarity index 100% rename from benches/HumanEval/8_sum_product/sum_product.py rename to benches/HumanEval/008_sum_product/sum_product.py diff --git a/benches/HumanEval/9_rolling_max/rolling_max.dfy b/benches/HumanEval/009_rolling_max/rolling_max.dfy similarity index 100% rename from benches/HumanEval/9_rolling_max/rolling_max.dfy rename to benches/HumanEval/009_rolling_max/rolling_max.dfy diff --git a/benches/HumanEval/9_rolling_max/rolling_max.nagini b/benches/HumanEval/009_rolling_max/rolling_max.nagini similarity index 100% rename from benches/HumanEval/9_rolling_max/rolling_max.nagini rename to benches/HumanEval/009_rolling_max/rolling_max.nagini diff --git a/benches/HumanEval/9_rolling_max/rolling_max.prompt b/benches/HumanEval/009_rolling_max/rolling_max.prompt similarity index 100% rename from benches/HumanEval/9_rolling_max/rolling_max.prompt rename to benches/HumanEval/009_rolling_max/rolling_max.prompt diff --git a/benches/HumanEval/9_rolling_max/rolling_max.py b/benches/HumanEval/009_rolling_max/rolling_max.py similarity index 100% rename from benches/HumanEval/9_rolling_max/rolling_max.py rename to benches/HumanEval/009_rolling_max/rolling_max.py diff --git a/benches/HumanEval/9_rolling_max/rolling_max.vpr b/benches/HumanEval/009_rolling_max/rolling_max.vpr similarity index 100% rename from benches/HumanEval/9_rolling_max/rolling_max.vpr rename to benches/HumanEval/009_rolling_max/rolling_max.vpr diff --git a/benches/HumanEval/10_is_palindrome/is_palindrome.dfy b/benches/HumanEval/010_is_palindrome/is_palindrome.dfy similarity index 100% rename from benches/HumanEval/10_is_palindrome/is_palindrome.dfy rename to benches/HumanEval/010_is_palindrome/is_palindrome.dfy diff --git a/benches/HumanEval/10_is_palindrome/is_palindrome.prompt b/benches/HumanEval/010_is_palindrome/is_palindrome.prompt similarity index 100% rename from benches/HumanEval/10_is_palindrome/is_palindrome.prompt rename to benches/HumanEval/010_is_palindrome/is_palindrome.prompt diff --git a/benches/HumanEval/10_is_palindrome/is_palindrome.py b/benches/HumanEval/010_is_palindrome/is_palindrome.py similarity index 100% rename from benches/HumanEval/10_is_palindrome/is_palindrome.py rename to benches/HumanEval/010_is_palindrome/is_palindrome.py diff --git a/benches/HumanEval/11_string_xor/string_xor.dfy b/benches/HumanEval/011_string_xor/string_xor.dfy similarity index 100% rename from benches/HumanEval/11_string_xor/string_xor.dfy rename to benches/HumanEval/011_string_xor/string_xor.dfy diff --git a/benches/HumanEval/11_string_xor/string_xor.prompt b/benches/HumanEval/011_string_xor/string_xor.prompt similarity index 100% rename from benches/HumanEval/11_string_xor/string_xor.prompt rename to benches/HumanEval/011_string_xor/string_xor.prompt diff --git a/benches/HumanEval/11_string_xor/string_xor.py b/benches/HumanEval/011_string_xor/string_xor.py similarity index 100% rename from benches/HumanEval/11_string_xor/string_xor.py rename to benches/HumanEval/011_string_xor/string_xor.py diff --git a/benches/HumanEval/12_longest/longest.dfy b/benches/HumanEval/012_longest/longest.dfy similarity index 100% rename from benches/HumanEval/12_longest/longest.dfy rename to benches/HumanEval/012_longest/longest.dfy diff --git a/benches/HumanEval/12_longest/longest.prompt b/benches/HumanEval/012_longest/longest.prompt similarity index 100% rename from benches/HumanEval/12_longest/longest.prompt rename to benches/HumanEval/012_longest/longest.prompt diff --git a/benches/HumanEval/12_longest/longest.py b/benches/HumanEval/012_longest/longest.py similarity index 100% rename from benches/HumanEval/12_longest/longest.py rename to benches/HumanEval/012_longest/longest.py diff --git a/benches/HumanEval/12_longest/longest1.dfy b/benches/HumanEval/012_longest/longest1.dfy similarity index 100% rename from benches/HumanEval/12_longest/longest1.dfy rename to benches/HumanEval/012_longest/longest1.dfy diff --git a/benches/HumanEval/13_greatest_common_divisor/greates_common_divisor.nagini b/benches/HumanEval/013_greatest_common_divisor/greates_common_divisor.nagini similarity index 100% rename from benches/HumanEval/13_greatest_common_divisor/greates_common_divisor.nagini rename to benches/HumanEval/013_greatest_common_divisor/greates_common_divisor.nagini diff --git a/benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.dfy b/benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.dfy similarity index 100% rename from benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.dfy rename to benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.dfy diff --git a/benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.prompt b/benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.prompt similarity index 100% rename from benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.prompt rename to benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.prompt diff --git a/benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.py b/benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.py similarity index 100% rename from benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.py rename to benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.py diff --git a/benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.vpr b/benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.vpr similarity index 100% rename from benches/HumanEval/13_greatest_common_divisor/greatest_common_divisor.vpr rename to benches/HumanEval/013_greatest_common_divisor/greatest_common_divisor.vpr diff --git a/benches/HumanEval/14_all_prefixes/all_prefixes.dfy b/benches/HumanEval/014_all_prefixes/all_prefixes.dfy similarity index 100% rename from benches/HumanEval/14_all_prefixes/all_prefixes.dfy rename to benches/HumanEval/014_all_prefixes/all_prefixes.dfy diff --git a/benches/HumanEval/14_all_prefixes/all_prefixes.prompt b/benches/HumanEval/014_all_prefixes/all_prefixes.prompt similarity index 100% rename from benches/HumanEval/14_all_prefixes/all_prefixes.prompt rename to benches/HumanEval/014_all_prefixes/all_prefixes.prompt diff --git a/benches/HumanEval/14_all_prefixes/all_prefixes.py b/benches/HumanEval/014_all_prefixes/all_prefixes.py similarity index 100% rename from benches/HumanEval/14_all_prefixes/all_prefixes.py rename to benches/HumanEval/014_all_prefixes/all_prefixes.py diff --git a/benches/HumanEval/15_string_sequence/string_sequence.prompt b/benches/HumanEval/015_string_sequence/string_sequence.prompt similarity index 100% rename from benches/HumanEval/15_string_sequence/string_sequence.prompt rename to benches/HumanEval/015_string_sequence/string_sequence.prompt diff --git a/benches/HumanEval/15_string_sequence/string_sequence.py b/benches/HumanEval/015_string_sequence/string_sequence.py similarity index 100% rename from benches/HumanEval/15_string_sequence/string_sequence.py rename to benches/HumanEval/015_string_sequence/string_sequence.py diff --git a/benches/HumanEval/16_count_distinct_characters/count_distinct_characters.prompt b/benches/HumanEval/016_count_distinct_characters/count_distinct_characters.prompt similarity index 100% rename from benches/HumanEval/16_count_distinct_characters/count_distinct_characters.prompt rename to benches/HumanEval/016_count_distinct_characters/count_distinct_characters.prompt diff --git a/benches/HumanEval/16_count_distinct_characters/count_distinct_characters.py b/benches/HumanEval/016_count_distinct_characters/count_distinct_characters.py similarity index 100% rename from benches/HumanEval/16_count_distinct_characters/count_distinct_characters.py rename to benches/HumanEval/016_count_distinct_characters/count_distinct_characters.py diff --git a/benches/HumanEval/17_parse_music/parse_music.prompt b/benches/HumanEval/017_parse_music/parse_music.prompt similarity index 100% rename from benches/HumanEval/17_parse_music/parse_music.prompt rename to benches/HumanEval/017_parse_music/parse_music.prompt diff --git a/benches/HumanEval/17_parse_music/parse_music.py b/benches/HumanEval/017_parse_music/parse_music.py similarity index 100% rename from benches/HumanEval/17_parse_music/parse_music.py rename to benches/HumanEval/017_parse_music/parse_music.py diff --git a/benches/HumanEval/18_how_many_times/how_many_times.prompt b/benches/HumanEval/018_how_many_times/how_many_times.prompt similarity index 100% rename from benches/HumanEval/18_how_many_times/how_many_times.prompt rename to benches/HumanEval/018_how_many_times/how_many_times.prompt diff --git a/benches/HumanEval/18_how_many_times/how_many_times.py b/benches/HumanEval/018_how_many_times/how_many_times.py similarity index 100% rename from benches/HumanEval/18_how_many_times/how_many_times.py rename to benches/HumanEval/018_how_many_times/how_many_times.py diff --git a/benches/HumanEval/19_sort_numbers/sort_numbers.prompt b/benches/HumanEval/019_sort_numbers/sort_numbers.prompt similarity index 100% rename from benches/HumanEval/19_sort_numbers/sort_numbers.prompt rename to benches/HumanEval/019_sort_numbers/sort_numbers.prompt diff --git a/benches/HumanEval/19_sort_numbers/sort_numbers.py b/benches/HumanEval/019_sort_numbers/sort_numbers.py similarity index 100% rename from benches/HumanEval/19_sort_numbers/sort_numbers.py rename to benches/HumanEval/019_sort_numbers/sort_numbers.py diff --git a/benches/HumanEval/20_find_closest_elements/find_closest_elements.prompt b/benches/HumanEval/020_find_closest_elements/find_closest_elements.prompt similarity index 100% rename from benches/HumanEval/20_find_closest_elements/find_closest_elements.prompt rename to benches/HumanEval/020_find_closest_elements/find_closest_elements.prompt diff --git a/benches/HumanEval/20_find_closest_elements/find_closest_elements.py b/benches/HumanEval/020_find_closest_elements/find_closest_elements.py similarity index 100% rename from benches/HumanEval/20_find_closest_elements/find_closest_elements.py rename to benches/HumanEval/020_find_closest_elements/find_closest_elements.py diff --git a/benches/HumanEval/21_rescale_to_unit/rescale_to_unit.prompt b/benches/HumanEval/021_rescale_to_unit/rescale_to_unit.prompt similarity index 100% rename from benches/HumanEval/21_rescale_to_unit/rescale_to_unit.prompt rename to benches/HumanEval/021_rescale_to_unit/rescale_to_unit.prompt diff --git a/benches/HumanEval/21_rescale_to_unit/rescale_to_unit.py b/benches/HumanEval/021_rescale_to_unit/rescale_to_unit.py similarity index 100% rename from benches/HumanEval/21_rescale_to_unit/rescale_to_unit.py rename to benches/HumanEval/021_rescale_to_unit/rescale_to_unit.py diff --git a/benches/HumanEval/22_filter_integers/filter_integers.prompt b/benches/HumanEval/022_filter_integers/filter_integers.prompt similarity index 100% rename from benches/HumanEval/22_filter_integers/filter_integers.prompt rename to benches/HumanEval/022_filter_integers/filter_integers.prompt diff --git a/benches/HumanEval/22_filter_integers/filter_integers.py b/benches/HumanEval/022_filter_integers/filter_integers.py similarity index 100% rename from benches/HumanEval/22_filter_integers/filter_integers.py rename to benches/HumanEval/022_filter_integers/filter_integers.py diff --git a/benches/HumanEval/23_strlen/strlen.prompt b/benches/HumanEval/023_strlen/strlen.prompt similarity index 100% rename from benches/HumanEval/23_strlen/strlen.prompt rename to benches/HumanEval/023_strlen/strlen.prompt diff --git a/benches/HumanEval/23_strlen/strlen.py b/benches/HumanEval/023_strlen/strlen.py similarity index 100% rename from benches/HumanEval/23_strlen/strlen.py rename to benches/HumanEval/023_strlen/strlen.py diff --git a/benches/HumanEval/24_largest_divisor/largest_divisor.prompt b/benches/HumanEval/024_largest_divisor/largest_divisor.prompt similarity index 100% rename from benches/HumanEval/24_largest_divisor/largest_divisor.prompt rename to benches/HumanEval/024_largest_divisor/largest_divisor.prompt diff --git a/benches/HumanEval/24_largest_divisor/largest_divisor.py b/benches/HumanEval/024_largest_divisor/largest_divisor.py similarity index 100% rename from benches/HumanEval/24_largest_divisor/largest_divisor.py rename to benches/HumanEval/024_largest_divisor/largest_divisor.py diff --git a/benches/HumanEval/25_factorize/factorize.prompt b/benches/HumanEval/025_factorize/factorize.prompt similarity index 100% rename from benches/HumanEval/25_factorize/factorize.prompt rename to benches/HumanEval/025_factorize/factorize.prompt diff --git a/benches/HumanEval/25_factorize/factorize.py b/benches/HumanEval/025_factorize/factorize.py similarity index 100% rename from benches/HumanEval/25_factorize/factorize.py rename to benches/HumanEval/025_factorize/factorize.py diff --git a/benches/HumanEval/26_remove_duplicates/remove_duplicates.prompt b/benches/HumanEval/026_remove_duplicates/remove_duplicates.prompt similarity index 100% rename from benches/HumanEval/26_remove_duplicates/remove_duplicates.prompt rename to benches/HumanEval/026_remove_duplicates/remove_duplicates.prompt diff --git a/benches/HumanEval/26_remove_duplicates/remove_duplicates.py b/benches/HumanEval/026_remove_duplicates/remove_duplicates.py similarity index 100% rename from benches/HumanEval/26_remove_duplicates/remove_duplicates.py rename to benches/HumanEval/026_remove_duplicates/remove_duplicates.py diff --git a/benches/HumanEval/27_flip_case/flip_case.prompt b/benches/HumanEval/027_flip_case/flip_case.prompt similarity index 100% rename from benches/HumanEval/27_flip_case/flip_case.prompt rename to benches/HumanEval/027_flip_case/flip_case.prompt diff --git a/benches/HumanEval/27_flip_case/flip_case.py b/benches/HumanEval/027_flip_case/flip_case.py similarity index 100% rename from benches/HumanEval/27_flip_case/flip_case.py rename to benches/HumanEval/027_flip_case/flip_case.py diff --git a/benches/HumanEval/28_concatenate/concatenate.prompt b/benches/HumanEval/028_concatenate/concatenate.prompt similarity index 100% rename from benches/HumanEval/28_concatenate/concatenate.prompt rename to benches/HumanEval/028_concatenate/concatenate.prompt diff --git a/benches/HumanEval/28_concatenate/concatenate.py b/benches/HumanEval/028_concatenate/concatenate.py similarity index 100% rename from benches/HumanEval/28_concatenate/concatenate.py rename to benches/HumanEval/028_concatenate/concatenate.py diff --git a/benches/HumanEval/29_filter_by_prefix/filter_by_prefix.prompt b/benches/HumanEval/029_filter_by_prefix/filter_by_prefix.prompt similarity index 100% rename from benches/HumanEval/29_filter_by_prefix/filter_by_prefix.prompt rename to benches/HumanEval/029_filter_by_prefix/filter_by_prefix.prompt diff --git a/benches/HumanEval/29_filter_by_prefix/filter_by_prefix.py b/benches/HumanEval/029_filter_by_prefix/filter_by_prefix.py similarity index 100% rename from benches/HumanEval/29_filter_by_prefix/filter_by_prefix.py rename to benches/HumanEval/029_filter_by_prefix/filter_by_prefix.py diff --git a/benches/HumanEval/30_get_positive/get_positive.prompt b/benches/HumanEval/030_get_positive/get_positive.prompt similarity index 100% rename from benches/HumanEval/30_get_positive/get_positive.prompt rename to benches/HumanEval/030_get_positive/get_positive.prompt diff --git a/benches/HumanEval/30_get_positive/get_positive.py b/benches/HumanEval/030_get_positive/get_positive.py similarity index 100% rename from benches/HumanEval/30_get_positive/get_positive.py rename to benches/HumanEval/030_get_positive/get_positive.py diff --git a/benches/HumanEval/31_is_prime/is_prime.prompt b/benches/HumanEval/031_is_prime/is_prime.prompt similarity index 100% rename from benches/HumanEval/31_is_prime/is_prime.prompt rename to benches/HumanEval/031_is_prime/is_prime.prompt diff --git a/benches/HumanEval/31_is_prime/is_prime.py b/benches/HumanEval/031_is_prime/is_prime.py similarity index 100% rename from benches/HumanEval/31_is_prime/is_prime.py rename to benches/HumanEval/031_is_prime/is_prime.py diff --git a/benches/HumanEval/32_poly/poly.prompt b/benches/HumanEval/032_poly/poly.prompt similarity index 100% rename from benches/HumanEval/32_poly/poly.prompt rename to benches/HumanEval/032_poly/poly.prompt diff --git a/benches/HumanEval/32_poly/poly.py b/benches/HumanEval/032_poly/poly.py similarity index 100% rename from benches/HumanEval/32_poly/poly.py rename to benches/HumanEval/032_poly/poly.py diff --git a/benches/HumanEval/33_sort_third/sort_third.prompt b/benches/HumanEval/033_sort_third/sort_third.prompt similarity index 100% rename from benches/HumanEval/33_sort_third/sort_third.prompt rename to benches/HumanEval/033_sort_third/sort_third.prompt diff --git a/benches/HumanEval/33_sort_third/sort_third.py b/benches/HumanEval/033_sort_third/sort_third.py similarity index 100% rename from benches/HumanEval/33_sort_third/sort_third.py rename to benches/HumanEval/033_sort_third/sort_third.py diff --git a/benches/HumanEval/34_unique/unique.prompt b/benches/HumanEval/034_unique/unique.prompt similarity index 100% rename from benches/HumanEval/34_unique/unique.prompt rename to benches/HumanEval/034_unique/unique.prompt diff --git a/benches/HumanEval/34_unique/unique.py b/benches/HumanEval/034_unique/unique.py similarity index 100% rename from benches/HumanEval/34_unique/unique.py rename to benches/HumanEval/034_unique/unique.py diff --git a/benches/HumanEval/35_max_element/max_element.prompt b/benches/HumanEval/035_max_element/max_element.prompt similarity index 100% rename from benches/HumanEval/35_max_element/max_element.prompt rename to benches/HumanEval/035_max_element/max_element.prompt diff --git a/benches/HumanEval/35_max_element/max_element.py b/benches/HumanEval/035_max_element/max_element.py similarity index 100% rename from benches/HumanEval/35_max_element/max_element.py rename to benches/HumanEval/035_max_element/max_element.py diff --git a/benches/HumanEval/36_fizz_buzz/fizz_buzz.prompt b/benches/HumanEval/036_fizz_buzz/fizz_buzz.prompt similarity index 100% rename from benches/HumanEval/36_fizz_buzz/fizz_buzz.prompt rename to benches/HumanEval/036_fizz_buzz/fizz_buzz.prompt diff --git a/benches/HumanEval/36_fizz_buzz/fizz_buzz.py b/benches/HumanEval/036_fizz_buzz/fizz_buzz.py similarity index 100% rename from benches/HumanEval/36_fizz_buzz/fizz_buzz.py rename to benches/HumanEval/036_fizz_buzz/fizz_buzz.py diff --git a/benches/HumanEval/37_sort_even/sort_even.prompt b/benches/HumanEval/037_sort_even/sort_even.prompt similarity index 100% rename from benches/HumanEval/37_sort_even/sort_even.prompt rename to benches/HumanEval/037_sort_even/sort_even.prompt diff --git a/benches/HumanEval/37_sort_even/sort_even.py b/benches/HumanEval/037_sort_even/sort_even.py similarity index 100% rename from benches/HumanEval/37_sort_even/sort_even.py rename to benches/HumanEval/037_sort_even/sort_even.py diff --git a/benches/HumanEval/38_encode_cyclic/encode_cyclic.prompt b/benches/HumanEval/038_encode_cyclic/encode_cyclic.prompt similarity index 100% rename from benches/HumanEval/38_encode_cyclic/encode_cyclic.prompt rename to benches/HumanEval/038_encode_cyclic/encode_cyclic.prompt diff --git a/benches/HumanEval/38_encode_cyclic/encode_cyclic.py b/benches/HumanEval/038_encode_cyclic/encode_cyclic.py similarity index 100% rename from benches/HumanEval/38_encode_cyclic/encode_cyclic.py rename to benches/HumanEval/038_encode_cyclic/encode_cyclic.py diff --git a/benches/HumanEval/39_prime_fib/prime_fib.prompt b/benches/HumanEval/039_prime_fib/prime_fib.prompt similarity index 100% rename from benches/HumanEval/39_prime_fib/prime_fib.prompt rename to benches/HumanEval/039_prime_fib/prime_fib.prompt diff --git a/benches/HumanEval/39_prime_fib/prime_fib.py b/benches/HumanEval/039_prime_fib/prime_fib.py similarity index 100% rename from benches/HumanEval/39_prime_fib/prime_fib.py rename to benches/HumanEval/039_prime_fib/prime_fib.py diff --git a/benches/HumanEval/40_triples_sum_to_zero/triples_sum_to_zero.prompt b/benches/HumanEval/040_triples_sum_to_zero/triples_sum_to_zero.prompt similarity index 100% rename from benches/HumanEval/40_triples_sum_to_zero/triples_sum_to_zero.prompt rename to benches/HumanEval/040_triples_sum_to_zero/triples_sum_to_zero.prompt diff --git a/benches/HumanEval/40_triples_sum_to_zero/triples_sum_to_zero.py b/benches/HumanEval/040_triples_sum_to_zero/triples_sum_to_zero.py similarity index 100% rename from benches/HumanEval/40_triples_sum_to_zero/triples_sum_to_zero.py rename to benches/HumanEval/040_triples_sum_to_zero/triples_sum_to_zero.py diff --git a/benches/HumanEval/41_car_race_collision/car_race_collision.prompt b/benches/HumanEval/041_car_race_collision/car_race_collision.prompt similarity index 100% rename from benches/HumanEval/41_car_race_collision/car_race_collision.prompt rename to benches/HumanEval/041_car_race_collision/car_race_collision.prompt diff --git a/benches/HumanEval/41_car_race_collision/car_race_collision.py b/benches/HumanEval/041_car_race_collision/car_race_collision.py similarity index 100% rename from benches/HumanEval/41_car_race_collision/car_race_collision.py rename to benches/HumanEval/041_car_race_collision/car_race_collision.py diff --git a/benches/HumanEval/42_incr_list/incr_list.prompt b/benches/HumanEval/042_incr_list/incr_list.prompt similarity index 100% rename from benches/HumanEval/42_incr_list/incr_list.prompt rename to benches/HumanEval/042_incr_list/incr_list.prompt diff --git a/benches/HumanEval/42_incr_list/incr_list.py b/benches/HumanEval/042_incr_list/incr_list.py similarity index 100% rename from benches/HumanEval/42_incr_list/incr_list.py rename to benches/HumanEval/042_incr_list/incr_list.py diff --git a/benches/HumanEval/43_pairs_sum_to_zero/pairs_sum_to_zero.prompt b/benches/HumanEval/043_pairs_sum_to_zero/pairs_sum_to_zero.prompt similarity index 100% rename from benches/HumanEval/43_pairs_sum_to_zero/pairs_sum_to_zero.prompt rename to benches/HumanEval/043_pairs_sum_to_zero/pairs_sum_to_zero.prompt diff --git a/benches/HumanEval/43_pairs_sum_to_zero/pairs_sum_to_zero.py b/benches/HumanEval/043_pairs_sum_to_zero/pairs_sum_to_zero.py similarity index 100% rename from benches/HumanEval/43_pairs_sum_to_zero/pairs_sum_to_zero.py rename to benches/HumanEval/043_pairs_sum_to_zero/pairs_sum_to_zero.py diff --git a/benches/HumanEval/44_change_base/change_base.prompt b/benches/HumanEval/044_change_base/change_base.prompt similarity index 100% rename from benches/HumanEval/44_change_base/change_base.prompt rename to benches/HumanEval/044_change_base/change_base.prompt diff --git a/benches/HumanEval/44_change_base/change_base.py b/benches/HumanEval/044_change_base/change_base.py similarity index 100% rename from benches/HumanEval/44_change_base/change_base.py rename to benches/HumanEval/044_change_base/change_base.py diff --git a/benches/HumanEval/45_triangle_area/triangle_area.prompt b/benches/HumanEval/045_triangle_area/triangle_area.prompt similarity index 100% rename from benches/HumanEval/45_triangle_area/triangle_area.prompt rename to benches/HumanEval/045_triangle_area/triangle_area.prompt diff --git a/benches/HumanEval/45_triangle_area/triangle_area.py b/benches/HumanEval/045_triangle_area/triangle_area.py similarity index 100% rename from benches/HumanEval/45_triangle_area/triangle_area.py rename to benches/HumanEval/045_triangle_area/triangle_area.py diff --git a/benches/HumanEval/46_fib4/fib4.prompt b/benches/HumanEval/046_fib4/fib4.prompt similarity index 100% rename from benches/HumanEval/46_fib4/fib4.prompt rename to benches/HumanEval/046_fib4/fib4.prompt diff --git a/benches/HumanEval/46_fib4/fib4.py b/benches/HumanEval/046_fib4/fib4.py similarity index 100% rename from benches/HumanEval/46_fib4/fib4.py rename to benches/HumanEval/046_fib4/fib4.py diff --git a/benches/HumanEval/47_median/median.prompt b/benches/HumanEval/047_median/median.prompt similarity index 100% rename from benches/HumanEval/47_median/median.prompt rename to benches/HumanEval/047_median/median.prompt diff --git a/benches/HumanEval/47_median/median.py b/benches/HumanEval/047_median/median.py similarity index 100% rename from benches/HumanEval/47_median/median.py rename to benches/HumanEval/047_median/median.py diff --git a/benches/HumanEval/48_is_palindrome/is_palindrome.prompt b/benches/HumanEval/048_is_palindrome/is_palindrome.prompt similarity index 100% rename from benches/HumanEval/48_is_palindrome/is_palindrome.prompt rename to benches/HumanEval/048_is_palindrome/is_palindrome.prompt diff --git a/benches/HumanEval/48_is_palindrome/is_palindrome.py b/benches/HumanEval/048_is_palindrome/is_palindrome.py similarity index 100% rename from benches/HumanEval/48_is_palindrome/is_palindrome.py rename to benches/HumanEval/048_is_palindrome/is_palindrome.py diff --git a/benches/HumanEval/49_modp/modp.prompt b/benches/HumanEval/049_modp/modp.prompt similarity index 100% rename from benches/HumanEval/49_modp/modp.prompt rename to benches/HumanEval/049_modp/modp.prompt diff --git a/benches/HumanEval/49_modp/modp.py b/benches/HumanEval/049_modp/modp.py similarity index 100% rename from benches/HumanEval/49_modp/modp.py rename to benches/HumanEval/049_modp/modp.py diff --git a/benches/HumanEval/50_encode_shift/encode_shift.prompt b/benches/HumanEval/050_encode_shift/encode_shift.prompt similarity index 100% rename from benches/HumanEval/50_encode_shift/encode_shift.prompt rename to benches/HumanEval/050_encode_shift/encode_shift.prompt diff --git a/benches/HumanEval/50_encode_shift/encode_shift.py b/benches/HumanEval/050_encode_shift/encode_shift.py similarity index 100% rename from benches/HumanEval/50_encode_shift/encode_shift.py rename to benches/HumanEval/050_encode_shift/encode_shift.py diff --git a/benches/HumanEval/51_remove_vowels/remove_vowels.prompt b/benches/HumanEval/051_remove_vowels/remove_vowels.prompt similarity index 100% rename from benches/HumanEval/51_remove_vowels/remove_vowels.prompt rename to benches/HumanEval/051_remove_vowels/remove_vowels.prompt diff --git a/benches/HumanEval/51_remove_vowels/remove_vowels.py b/benches/HumanEval/051_remove_vowels/remove_vowels.py similarity index 100% rename from benches/HumanEval/51_remove_vowels/remove_vowels.py rename to benches/HumanEval/051_remove_vowels/remove_vowels.py diff --git a/benches/HumanEval/52_below_threshold/below_threshold.prompt b/benches/HumanEval/052_below_threshold/below_threshold.prompt similarity index 100% rename from benches/HumanEval/52_below_threshold/below_threshold.prompt rename to benches/HumanEval/052_below_threshold/below_threshold.prompt diff --git a/benches/HumanEval/52_below_threshold/below_threshold.py b/benches/HumanEval/052_below_threshold/below_threshold.py similarity index 100% rename from benches/HumanEval/52_below_threshold/below_threshold.py rename to benches/HumanEval/052_below_threshold/below_threshold.py diff --git a/benches/HumanEval/53_add/add.prompt b/benches/HumanEval/053_add/add.prompt similarity index 100% rename from benches/HumanEval/53_add/add.prompt rename to benches/HumanEval/053_add/add.prompt diff --git a/benches/HumanEval/53_add/add.py b/benches/HumanEval/053_add/add.py similarity index 100% rename from benches/HumanEval/53_add/add.py rename to benches/HumanEval/053_add/add.py diff --git a/benches/HumanEval/54_same_chars/same_chars.prompt b/benches/HumanEval/054_same_chars/same_chars.prompt similarity index 100% rename from benches/HumanEval/54_same_chars/same_chars.prompt rename to benches/HumanEval/054_same_chars/same_chars.prompt diff --git a/benches/HumanEval/54_same_chars/same_chars.py b/benches/HumanEval/054_same_chars/same_chars.py similarity index 100% rename from benches/HumanEval/54_same_chars/same_chars.py rename to benches/HumanEval/054_same_chars/same_chars.py diff --git a/benches/HumanEval/55_fib/fib.prompt b/benches/HumanEval/055_fib/fib.prompt similarity index 100% rename from benches/HumanEval/55_fib/fib.prompt rename to benches/HumanEval/055_fib/fib.prompt diff --git a/benches/HumanEval/55_fib/fib.py b/benches/HumanEval/055_fib/fib.py similarity index 100% rename from benches/HumanEval/55_fib/fib.py rename to benches/HumanEval/055_fib/fib.py diff --git a/benches/HumanEval/56_correct_bracketing/correct_bracketing.prompt b/benches/HumanEval/056_correct_bracketing/correct_bracketing.prompt similarity index 100% rename from benches/HumanEval/56_correct_bracketing/correct_bracketing.prompt rename to benches/HumanEval/056_correct_bracketing/correct_bracketing.prompt diff --git a/benches/HumanEval/56_correct_bracketing/correct_bracketing.py b/benches/HumanEval/056_correct_bracketing/correct_bracketing.py similarity index 100% rename from benches/HumanEval/56_correct_bracketing/correct_bracketing.py rename to benches/HumanEval/056_correct_bracketing/correct_bracketing.py diff --git a/benches/HumanEval/57_monotonic/monotonic.prompt b/benches/HumanEval/057_monotonic/monotonic.prompt similarity index 100% rename from benches/HumanEval/57_monotonic/monotonic.prompt rename to benches/HumanEval/057_monotonic/monotonic.prompt diff --git a/benches/HumanEval/57_monotonic/monotonic.py b/benches/HumanEval/057_monotonic/monotonic.py similarity index 100% rename from benches/HumanEval/57_monotonic/monotonic.py rename to benches/HumanEval/057_monotonic/monotonic.py diff --git a/benches/HumanEval/58_common/common.prompt b/benches/HumanEval/058_common/common.prompt similarity index 100% rename from benches/HumanEval/58_common/common.prompt rename to benches/HumanEval/058_common/common.prompt diff --git a/benches/HumanEval/58_common/common.py b/benches/HumanEval/058_common/common.py similarity index 100% rename from benches/HumanEval/58_common/common.py rename to benches/HumanEval/058_common/common.py diff --git a/benches/HumanEval/59_largest_prime_factor/largest_prime_factor.prompt b/benches/HumanEval/059_largest_prime_factor/largest_prime_factor.prompt similarity index 100% rename from benches/HumanEval/59_largest_prime_factor/largest_prime_factor.prompt rename to benches/HumanEval/059_largest_prime_factor/largest_prime_factor.prompt diff --git a/benches/HumanEval/59_largest_prime_factor/largest_prime_factor.py b/benches/HumanEval/059_largest_prime_factor/largest_prime_factor.py similarity index 100% rename from benches/HumanEval/59_largest_prime_factor/largest_prime_factor.py rename to benches/HumanEval/059_largest_prime_factor/largest_prime_factor.py diff --git a/benches/HumanEval/60_sum_to_n/sum_to_n.prompt b/benches/HumanEval/060_sum_to_n/sum_to_n.prompt similarity index 100% rename from benches/HumanEval/60_sum_to_n/sum_to_n.prompt rename to benches/HumanEval/060_sum_to_n/sum_to_n.prompt diff --git a/benches/HumanEval/60_sum_to_n/sum_to_n.py b/benches/HumanEval/060_sum_to_n/sum_to_n.py similarity index 100% rename from benches/HumanEval/60_sum_to_n/sum_to_n.py rename to benches/HumanEval/060_sum_to_n/sum_to_n.py diff --git a/benches/HumanEval/61_correct_bracketing/correct_bracketing.prompt b/benches/HumanEval/061_correct_bracketing/correct_bracketing.prompt similarity index 100% rename from benches/HumanEval/61_correct_bracketing/correct_bracketing.prompt rename to benches/HumanEval/061_correct_bracketing/correct_bracketing.prompt diff --git a/benches/HumanEval/61_correct_bracketing/correct_bracketing.py b/benches/HumanEval/061_correct_bracketing/correct_bracketing.py similarity index 100% rename from benches/HumanEval/61_correct_bracketing/correct_bracketing.py rename to benches/HumanEval/061_correct_bracketing/correct_bracketing.py diff --git a/benches/HumanEval/62_derivative/derivative.prompt b/benches/HumanEval/062_derivative/derivative.prompt similarity index 100% rename from benches/HumanEval/62_derivative/derivative.prompt rename to benches/HumanEval/062_derivative/derivative.prompt diff --git a/benches/HumanEval/62_derivative/derivative.py b/benches/HumanEval/062_derivative/derivative.py similarity index 100% rename from benches/HumanEval/62_derivative/derivative.py rename to benches/HumanEval/062_derivative/derivative.py diff --git a/benches/HumanEval/63_fibfib/fibfib.prompt b/benches/HumanEval/063_fibfib/fibfib.prompt similarity index 100% rename from benches/HumanEval/63_fibfib/fibfib.prompt rename to benches/HumanEval/063_fibfib/fibfib.prompt diff --git a/benches/HumanEval/63_fibfib/fibfib.py b/benches/HumanEval/063_fibfib/fibfib.py similarity index 100% rename from benches/HumanEval/63_fibfib/fibfib.py rename to benches/HumanEval/063_fibfib/fibfib.py diff --git a/benches/HumanEval/64_vowels_count/vowels_count.prompt b/benches/HumanEval/064_vowels_count/vowels_count.prompt similarity index 100% rename from benches/HumanEval/64_vowels_count/vowels_count.prompt rename to benches/HumanEval/064_vowels_count/vowels_count.prompt diff --git a/benches/HumanEval/64_vowels_count/vowels_count.py b/benches/HumanEval/064_vowels_count/vowels_count.py similarity index 100% rename from benches/HumanEval/64_vowels_count/vowels_count.py rename to benches/HumanEval/064_vowels_count/vowels_count.py diff --git a/benches/HumanEval/65_circular_shift/circular_shift.prompt b/benches/HumanEval/065_circular_shift/circular_shift.prompt similarity index 100% rename from benches/HumanEval/65_circular_shift/circular_shift.prompt rename to benches/HumanEval/065_circular_shift/circular_shift.prompt diff --git a/benches/HumanEval/65_circular_shift/circular_shift.py b/benches/HumanEval/065_circular_shift/circular_shift.py similarity index 100% rename from benches/HumanEval/65_circular_shift/circular_shift.py rename to benches/HumanEval/065_circular_shift/circular_shift.py diff --git a/benches/HumanEval/66_digitSum/digitSum.prompt b/benches/HumanEval/066_digitSum/digitSum.prompt similarity index 100% rename from benches/HumanEval/66_digitSum/digitSum.prompt rename to benches/HumanEval/066_digitSum/digitSum.prompt diff --git a/benches/HumanEval/66_digitSum/digitSum.py b/benches/HumanEval/066_digitSum/digitSum.py similarity index 100% rename from benches/HumanEval/66_digitSum/digitSum.py rename to benches/HumanEval/066_digitSum/digitSum.py diff --git a/benches/HumanEval/67_fruit_distribution/fruit_distribution.prompt b/benches/HumanEval/067_fruit_distribution/fruit_distribution.prompt similarity index 100% rename from benches/HumanEval/67_fruit_distribution/fruit_distribution.prompt rename to benches/HumanEval/067_fruit_distribution/fruit_distribution.prompt diff --git a/benches/HumanEval/67_fruit_distribution/fruit_distribution.py b/benches/HumanEval/067_fruit_distribution/fruit_distribution.py similarity index 100% rename from benches/HumanEval/67_fruit_distribution/fruit_distribution.py rename to benches/HumanEval/067_fruit_distribution/fruit_distribution.py diff --git a/benches/HumanEval/68_pluck/pluck.prompt b/benches/HumanEval/068_pluck/pluck.prompt similarity index 100% rename from benches/HumanEval/68_pluck/pluck.prompt rename to benches/HumanEval/068_pluck/pluck.prompt diff --git a/benches/HumanEval/68_pluck/pluck.py b/benches/HumanEval/068_pluck/pluck.py similarity index 100% rename from benches/HumanEval/68_pluck/pluck.py rename to benches/HumanEval/068_pluck/pluck.py diff --git a/benches/HumanEval/69_search/search.prompt b/benches/HumanEval/069_search/search.prompt similarity index 100% rename from benches/HumanEval/69_search/search.prompt rename to benches/HumanEval/069_search/search.prompt diff --git a/benches/HumanEval/69_search/search.py b/benches/HumanEval/069_search/search.py similarity index 100% rename from benches/HumanEval/69_search/search.py rename to benches/HumanEval/069_search/search.py diff --git a/benches/HumanEval/70_strange_sort_list/strange_sort_list.prompt b/benches/HumanEval/070_strange_sort_list/strange_sort_list.prompt similarity index 100% rename from benches/HumanEval/70_strange_sort_list/strange_sort_list.prompt rename to benches/HumanEval/070_strange_sort_list/strange_sort_list.prompt diff --git a/benches/HumanEval/70_strange_sort_list/strange_sort_list.py b/benches/HumanEval/070_strange_sort_list/strange_sort_list.py similarity index 100% rename from benches/HumanEval/70_strange_sort_list/strange_sort_list.py rename to benches/HumanEval/070_strange_sort_list/strange_sort_list.py diff --git a/benches/HumanEval/71_triangle_area/triangle_area.prompt b/benches/HumanEval/071_triangle_area/triangle_area.prompt similarity index 100% rename from benches/HumanEval/71_triangle_area/triangle_area.prompt rename to benches/HumanEval/071_triangle_area/triangle_area.prompt diff --git a/benches/HumanEval/71_triangle_area/triangle_area.py b/benches/HumanEval/071_triangle_area/triangle_area.py similarity index 100% rename from benches/HumanEval/71_triangle_area/triangle_area.py rename to benches/HumanEval/071_triangle_area/triangle_area.py diff --git a/benches/HumanEval/72_will_it_fly/will_it_fly.prompt b/benches/HumanEval/072_will_it_fly/will_it_fly.prompt similarity index 100% rename from benches/HumanEval/72_will_it_fly/will_it_fly.prompt rename to benches/HumanEval/072_will_it_fly/will_it_fly.prompt diff --git a/benches/HumanEval/72_will_it_fly/will_it_fly.py b/benches/HumanEval/072_will_it_fly/will_it_fly.py similarity index 100% rename from benches/HumanEval/72_will_it_fly/will_it_fly.py rename to benches/HumanEval/072_will_it_fly/will_it_fly.py diff --git a/benches/HumanEval/73_smallest_change/smallest_change.prompt b/benches/HumanEval/073_smallest_change/smallest_change.prompt similarity index 100% rename from benches/HumanEval/73_smallest_change/smallest_change.prompt rename to benches/HumanEval/073_smallest_change/smallest_change.prompt diff --git a/benches/HumanEval/73_smallest_change/smallest_change.py b/benches/HumanEval/073_smallest_change/smallest_change.py similarity index 100% rename from benches/HumanEval/73_smallest_change/smallest_change.py rename to benches/HumanEval/073_smallest_change/smallest_change.py diff --git a/benches/HumanEval/74_total_match/total_match.prompt b/benches/HumanEval/074_total_match/total_match.prompt similarity index 100% rename from benches/HumanEval/74_total_match/total_match.prompt rename to benches/HumanEval/074_total_match/total_match.prompt diff --git a/benches/HumanEval/74_total_match/total_match.py b/benches/HumanEval/074_total_match/total_match.py similarity index 100% rename from benches/HumanEval/74_total_match/total_match.py rename to benches/HumanEval/074_total_match/total_match.py diff --git a/benches/HumanEval/75_is_multiply_prime/is_multiply_prime.prompt b/benches/HumanEval/075_is_multiply_prime/is_multiply_prime.prompt similarity index 100% rename from benches/HumanEval/75_is_multiply_prime/is_multiply_prime.prompt rename to benches/HumanEval/075_is_multiply_prime/is_multiply_prime.prompt diff --git a/benches/HumanEval/75_is_multiply_prime/is_multiply_prime.py b/benches/HumanEval/075_is_multiply_prime/is_multiply_prime.py similarity index 100% rename from benches/HumanEval/75_is_multiply_prime/is_multiply_prime.py rename to benches/HumanEval/075_is_multiply_prime/is_multiply_prime.py diff --git a/benches/HumanEval/76_is_simple_power/is_simple_power.prompt b/benches/HumanEval/076_is_simple_power/is_simple_power.prompt similarity index 100% rename from benches/HumanEval/76_is_simple_power/is_simple_power.prompt rename to benches/HumanEval/076_is_simple_power/is_simple_power.prompt diff --git a/benches/HumanEval/76_is_simple_power/is_simple_power.py b/benches/HumanEval/076_is_simple_power/is_simple_power.py similarity index 100% rename from benches/HumanEval/76_is_simple_power/is_simple_power.py rename to benches/HumanEval/076_is_simple_power/is_simple_power.py diff --git a/benches/HumanEval/77_iscube/iscube.prompt b/benches/HumanEval/077_iscube/iscube.prompt similarity index 100% rename from benches/HumanEval/77_iscube/iscube.prompt rename to benches/HumanEval/077_iscube/iscube.prompt diff --git a/benches/HumanEval/77_iscube/iscube.py b/benches/HumanEval/077_iscube/iscube.py similarity index 100% rename from benches/HumanEval/77_iscube/iscube.py rename to benches/HumanEval/077_iscube/iscube.py diff --git a/benches/HumanEval/78_hex_key/hex_key.prompt b/benches/HumanEval/078_hex_key/hex_key.prompt similarity index 100% rename from benches/HumanEval/78_hex_key/hex_key.prompt rename to benches/HumanEval/078_hex_key/hex_key.prompt diff --git a/benches/HumanEval/78_hex_key/hex_key.py b/benches/HumanEval/078_hex_key/hex_key.py similarity index 100% rename from benches/HumanEval/78_hex_key/hex_key.py rename to benches/HumanEval/078_hex_key/hex_key.py diff --git a/benches/HumanEval/79_decimal_to_binary/decimal_to_binary.prompt b/benches/HumanEval/079_decimal_to_binary/decimal_to_binary.prompt similarity index 100% rename from benches/HumanEval/79_decimal_to_binary/decimal_to_binary.prompt rename to benches/HumanEval/079_decimal_to_binary/decimal_to_binary.prompt diff --git a/benches/HumanEval/79_decimal_to_binary/decimal_to_binary.py b/benches/HumanEval/079_decimal_to_binary/decimal_to_binary.py similarity index 100% rename from benches/HumanEval/79_decimal_to_binary/decimal_to_binary.py rename to benches/HumanEval/079_decimal_to_binary/decimal_to_binary.py diff --git a/benches/HumanEval/80_is_happy/is_happy.prompt b/benches/HumanEval/080_is_happy/is_happy.prompt similarity index 100% rename from benches/HumanEval/80_is_happy/is_happy.prompt rename to benches/HumanEval/080_is_happy/is_happy.prompt diff --git a/benches/HumanEval/80_is_happy/is_happy.py b/benches/HumanEval/080_is_happy/is_happy.py similarity index 100% rename from benches/HumanEval/80_is_happy/is_happy.py rename to benches/HumanEval/080_is_happy/is_happy.py diff --git a/benches/HumanEval/81_numerical_letter_grade/numerical_letter_grade.prompt b/benches/HumanEval/081_numerical_letter_grade/numerical_letter_grade.prompt similarity index 100% rename from benches/HumanEval/81_numerical_letter_grade/numerical_letter_grade.prompt rename to benches/HumanEval/081_numerical_letter_grade/numerical_letter_grade.prompt diff --git a/benches/HumanEval/81_numerical_letter_grade/numerical_letter_grade.py b/benches/HumanEval/081_numerical_letter_grade/numerical_letter_grade.py similarity index 100% rename from benches/HumanEval/81_numerical_letter_grade/numerical_letter_grade.py rename to benches/HumanEval/081_numerical_letter_grade/numerical_letter_grade.py diff --git a/benches/HumanEval/82_prime_length/prime_length.prompt b/benches/HumanEval/082_prime_length/prime_length.prompt similarity index 100% rename from benches/HumanEval/82_prime_length/prime_length.prompt rename to benches/HumanEval/082_prime_length/prime_length.prompt diff --git a/benches/HumanEval/82_prime_length/prime_length.py b/benches/HumanEval/082_prime_length/prime_length.py similarity index 100% rename from benches/HumanEval/82_prime_length/prime_length.py rename to benches/HumanEval/082_prime_length/prime_length.py diff --git a/benches/HumanEval/83_starts_one_ends/starts_one_ends.prompt b/benches/HumanEval/083_starts_one_ends/starts_one_ends.prompt similarity index 100% rename from benches/HumanEval/83_starts_one_ends/starts_one_ends.prompt rename to benches/HumanEval/083_starts_one_ends/starts_one_ends.prompt diff --git a/benches/HumanEval/83_starts_one_ends/starts_one_ends.py b/benches/HumanEval/083_starts_one_ends/starts_one_ends.py similarity index 100% rename from benches/HumanEval/83_starts_one_ends/starts_one_ends.py rename to benches/HumanEval/083_starts_one_ends/starts_one_ends.py diff --git a/benches/HumanEval/84_solve/solve.prompt b/benches/HumanEval/084_solve/solve.prompt similarity index 100% rename from benches/HumanEval/84_solve/solve.prompt rename to benches/HumanEval/084_solve/solve.prompt diff --git a/benches/HumanEval/84_solve/solve.py b/benches/HumanEval/084_solve/solve.py similarity index 100% rename from benches/HumanEval/84_solve/solve.py rename to benches/HumanEval/084_solve/solve.py diff --git a/benches/HumanEval/85_add/add.prompt b/benches/HumanEval/085_add/add.prompt similarity index 100% rename from benches/HumanEval/85_add/add.prompt rename to benches/HumanEval/085_add/add.prompt diff --git a/benches/HumanEval/85_add/add.py b/benches/HumanEval/085_add/add.py similarity index 100% rename from benches/HumanEval/85_add/add.py rename to benches/HumanEval/085_add/add.py diff --git a/benches/HumanEval/86_anti_shuffle/anti_shuffle.prompt b/benches/HumanEval/086_anti_shuffle/anti_shuffle.prompt similarity index 100% rename from benches/HumanEval/86_anti_shuffle/anti_shuffle.prompt rename to benches/HumanEval/086_anti_shuffle/anti_shuffle.prompt diff --git a/benches/HumanEval/86_anti_shuffle/anti_shuffle.py b/benches/HumanEval/086_anti_shuffle/anti_shuffle.py similarity index 100% rename from benches/HumanEval/86_anti_shuffle/anti_shuffle.py rename to benches/HumanEval/086_anti_shuffle/anti_shuffle.py diff --git a/benches/HumanEval/87_get_row/get_row.prompt b/benches/HumanEval/087_get_row/get_row.prompt similarity index 100% rename from benches/HumanEval/87_get_row/get_row.prompt rename to benches/HumanEval/087_get_row/get_row.prompt diff --git a/benches/HumanEval/87_get_row/get_row.py b/benches/HumanEval/087_get_row/get_row.py similarity index 100% rename from benches/HumanEval/87_get_row/get_row.py rename to benches/HumanEval/087_get_row/get_row.py diff --git a/benches/HumanEval/88_sort_array/sort_array.prompt b/benches/HumanEval/088_sort_array/sort_array.prompt similarity index 100% rename from benches/HumanEval/88_sort_array/sort_array.prompt rename to benches/HumanEval/088_sort_array/sort_array.prompt diff --git a/benches/HumanEval/88_sort_array/sort_array.py b/benches/HumanEval/088_sort_array/sort_array.py similarity index 100% rename from benches/HumanEval/88_sort_array/sort_array.py rename to benches/HumanEval/088_sort_array/sort_array.py diff --git a/benches/HumanEval/89_encrypt/encrypt.prompt b/benches/HumanEval/089_encrypt/encrypt.prompt similarity index 100% rename from benches/HumanEval/89_encrypt/encrypt.prompt rename to benches/HumanEval/089_encrypt/encrypt.prompt diff --git a/benches/HumanEval/89_encrypt/encrypt.py b/benches/HumanEval/089_encrypt/encrypt.py similarity index 100% rename from benches/HumanEval/89_encrypt/encrypt.py rename to benches/HumanEval/089_encrypt/encrypt.py diff --git a/benches/HumanEval/90_next_smallest/next_smallest.prompt b/benches/HumanEval/090_next_smallest/next_smallest.prompt similarity index 100% rename from benches/HumanEval/90_next_smallest/next_smallest.prompt rename to benches/HumanEval/090_next_smallest/next_smallest.prompt diff --git a/benches/HumanEval/90_next_smallest/next_smallest.py b/benches/HumanEval/090_next_smallest/next_smallest.py similarity index 100% rename from benches/HumanEval/90_next_smallest/next_smallest.py rename to benches/HumanEval/090_next_smallest/next_smallest.py diff --git a/benches/HumanEval/91_is_bored/is_bored.prompt b/benches/HumanEval/091_is_bored/is_bored.prompt similarity index 100% rename from benches/HumanEval/91_is_bored/is_bored.prompt rename to benches/HumanEval/091_is_bored/is_bored.prompt diff --git a/benches/HumanEval/91_is_bored/is_bored.py b/benches/HumanEval/091_is_bored/is_bored.py similarity index 100% rename from benches/HumanEval/91_is_bored/is_bored.py rename to benches/HumanEval/091_is_bored/is_bored.py diff --git a/benches/HumanEval/92_any_int/any_int.prompt b/benches/HumanEval/092_any_int/any_int.prompt similarity index 100% rename from benches/HumanEval/92_any_int/any_int.prompt rename to benches/HumanEval/092_any_int/any_int.prompt diff --git a/benches/HumanEval/92_any_int/any_int.py b/benches/HumanEval/092_any_int/any_int.py similarity index 100% rename from benches/HumanEval/92_any_int/any_int.py rename to benches/HumanEval/092_any_int/any_int.py diff --git a/benches/HumanEval/93_encode/encode.prompt b/benches/HumanEval/093_encode/encode.prompt similarity index 100% rename from benches/HumanEval/93_encode/encode.prompt rename to benches/HumanEval/093_encode/encode.prompt diff --git a/benches/HumanEval/93_encode/encode.py b/benches/HumanEval/093_encode/encode.py similarity index 100% rename from benches/HumanEval/93_encode/encode.py rename to benches/HumanEval/093_encode/encode.py diff --git a/benches/HumanEval/94_skjkasdkd/skjkasdkd.prompt b/benches/HumanEval/094_skjkasdkd/skjkasdkd.prompt similarity index 100% rename from benches/HumanEval/94_skjkasdkd/skjkasdkd.prompt rename to benches/HumanEval/094_skjkasdkd/skjkasdkd.prompt diff --git a/benches/HumanEval/94_skjkasdkd/skjkasdkd.py b/benches/HumanEval/094_skjkasdkd/skjkasdkd.py similarity index 100% rename from benches/HumanEval/94_skjkasdkd/skjkasdkd.py rename to benches/HumanEval/094_skjkasdkd/skjkasdkd.py diff --git a/benches/HumanEval/95_check_dict_case/check_dict_case.prompt b/benches/HumanEval/095_check_dict_case/check_dict_case.prompt similarity index 100% rename from benches/HumanEval/95_check_dict_case/check_dict_case.prompt rename to benches/HumanEval/095_check_dict_case/check_dict_case.prompt diff --git a/benches/HumanEval/95_check_dict_case/check_dict_case.py b/benches/HumanEval/095_check_dict_case/check_dict_case.py similarity index 100% rename from benches/HumanEval/95_check_dict_case/check_dict_case.py rename to benches/HumanEval/095_check_dict_case/check_dict_case.py diff --git a/benches/HumanEval/96_count_up_to/count_up_to.prompt b/benches/HumanEval/096_count_up_to/count_up_to.prompt similarity index 100% rename from benches/HumanEval/96_count_up_to/count_up_to.prompt rename to benches/HumanEval/096_count_up_to/count_up_to.prompt diff --git a/benches/HumanEval/96_count_up_to/count_up_to.py b/benches/HumanEval/096_count_up_to/count_up_to.py similarity index 100% rename from benches/HumanEval/96_count_up_to/count_up_to.py rename to benches/HumanEval/096_count_up_to/count_up_to.py diff --git a/benches/HumanEval/97_multiply/multiply.prompt b/benches/HumanEval/097_multiply/multiply.prompt similarity index 100% rename from benches/HumanEval/97_multiply/multiply.prompt rename to benches/HumanEval/097_multiply/multiply.prompt diff --git a/benches/HumanEval/97_multiply/multiply.py b/benches/HumanEval/097_multiply/multiply.py similarity index 100% rename from benches/HumanEval/97_multiply/multiply.py rename to benches/HumanEval/097_multiply/multiply.py diff --git a/benches/HumanEval/98_count_upper/count_upper.prompt b/benches/HumanEval/098_count_upper/count_upper.prompt similarity index 100% rename from benches/HumanEval/98_count_upper/count_upper.prompt rename to benches/HumanEval/098_count_upper/count_upper.prompt diff --git a/benches/HumanEval/98_count_upper/count_upper.py b/benches/HumanEval/098_count_upper/count_upper.py similarity index 100% rename from benches/HumanEval/98_count_upper/count_upper.py rename to benches/HumanEval/098_count_upper/count_upper.py diff --git a/benches/HumanEval/99_closest_integer/closest_integer.prompt b/benches/HumanEval/099_closest_integer/closest_integer.prompt similarity index 100% rename from benches/HumanEval/99_closest_integer/closest_integer.prompt rename to benches/HumanEval/099_closest_integer/closest_integer.prompt diff --git a/benches/HumanEval/99_closest_integer/closest_integer.py b/benches/HumanEval/099_closest_integer/closest_integer.py similarity index 100% rename from benches/HumanEval/99_closest_integer/closest_integer.py rename to benches/HumanEval/099_closest_integer/closest_integer.py