Spaces:

Hokin
/

spiral

Sleeping

File size: 8,971 Bytes

714a85e

import re
from pathlib import Path

import numpy as np

from maze_generator import *
from prompt_builder import *

def encode_maze(maze, encoding_type):
    """Encode ``maze`` as text using the encoder selected by ``encoding_type``.

    Args:
        maze: The maze to encode; passed through unchanged to the encoder.
        encoding_type: ``"matrix"``, ``"coord_list"`` or ``"vision"``.

    Returns:
        Whatever the selected encoder returns.

    Raises:
        NotImplementedError: If ``encoding_type`` is not one of the above.
    """
    # "vision" is routed to the same encoder as "matrix".
    if encoding_type in ("matrix", "vision"):
        return encode_standard_matrix_maze(maze)
    if encoding_type == "coord_list":
        return encode_coordinate_list_maze(maze)
    raise NotImplementedError

# RECOGNIZE 
def contains_word_case_insensitive(s, word_list):
    """Return True if ``s`` contains any entry of ``word_list`` as a whole word.

    Matching ignores case and requires a word boundary on both sides of the
    entry, so ``"square"`` matches ``"a Square"`` but not ``"squares"``.

    Args:
        s: The text to search.
        word_list: Iterable of literal words or phrases (regex metacharacters
            are escaped).

    Returns:
        bool: True when at least one non-empty entry is found, otherwise False.
        An empty ``word_list`` (or one holding only empty strings) yields False.
    """
    # Drop empty entries: an empty alternative would match at any word
    # boundary and make the check succeed for almost every input.
    alternatives = [re.escape(word) for word in word_list if word]
    if not alternatives:
        return False
    pattern = r'\b(?:' + '|'.join(alternatives) + r')\b'
    return re.search(pattern, s, re.IGNORECASE) is not None

def is_correct_recognize(response, shape):
    """Check whether ``response`` names ``shape`` or one of its accepted synonyms.

    Args:
        response: The model's free-text answer.
        shape: One of ``'square'``, ``'triangle'``, ``'spiral'``, ``'cross'``,
            ``'C'`` or ``'Z'``.

    Returns:
        bool: True if any accepted word for ``shape`` occurs in ``response``
        as a whole word, ignoring case.

    Raises:
        ValueError: If ``shape`` is not one of the supported shapes.
    """
    accepted_words = {
        'square': ['square', 'box', 'cube', 'symmetrical rectangle', 'right-angled quadrilateral', 'symmetric quadrilateral', "four-sided polygon"],
        'triangle': ['triangle', 'pyramid', 'trilateral', 'three-sided polygon', 'isosceles'],
        'spiral': ['spiral', 'helix', 'coil', 'whorl', 'swirl', 'vortex'],
        'cross': ['cross', 'times', 'multiplication', 'X', 'X-shape', 'crossed lines', 'crossing'],
        'C': ['C', 'crescent', 'half-circle', 'curved line', 'semi-circle', 'semi circle', 'open curve'],
        'Z': ['Z', 'zigzag', 'lightning bolt'],
    }

    # Fail loudly on an unsupported shape instead of hitting an unassigned
    # local further down.
    if shape not in accepted_words:
        raise ValueError(
            f"Unknown shape {shape!r}; expected one of {sorted(accepted_words)}"
        )

    return contains_word_case_insensitive(response, accepted_words[shape])

# GENERATE

def is_correct_generate(response, encoding_type, size, shape, orig_maze):
    """Check whether ``response`` contains a new maze of the requested shape.

    The function named ``all_<shape>_path_mazes`` is looked up in this module's
    globals and called with ``size``; every maze it returns is expanded with
    ``init_all_start_end`` and encoded with ``encode_maze``. The encoding of
    ``orig_maze`` is then excluded, so repeating the original maze does not
    count.

    Args:
        response: The model's text output.
        encoding_type: Encoding name forwarded to ``encode_maze``.
        size: Argument forwarded to the ``all_<shape>_path_mazes`` function.
        shape: Shape name used to select the maze-enumeration function.
        orig_maze: The maze whose encoding must not be counted as a hit.

    Returns:
        bool: True if any remaining encoding occurs as a substring of
        ``response``.

    Raises:
        KeyError: If no ``all_<shape>_path_mazes`` global exists, or if the
            encoding of ``orig_maze`` is not among the candidate encodings.
    """
    enumerate_mazes = globals()[f"all_{shape}_path_mazes"]

    # Expand every base maze first, then encode, keeping the original
    # two-stage order of calls.
    candidates = []
    for base_maze in enumerate_mazes(size):
        candidates += init_all_start_end(base_maze)

    encodings = {encode_maze(candidate, encoding_type) for candidate in candidates}
    encodings.remove(encode_maze(orig_maze, encoding_type))

    return any(encoding in response for encoding in encodings)

def is_correct_solution(response, maze):
    """Decide whether ``response`` contains a valid path from start to end.

    Every ``(x, y)`` integer pair in ``response`` is extracted in order. The
    check begins at the last occurrence of the maze's end cell and walks
    backwards through the preceding coordinates; each step must be a valid
    move as reported by ``get_valid_moves``. The solution is accepted as soon
    as the walk reaches the start cell.

    Args:
        response: The model's text output.
        maze: Array in which one cell equals ``POS`` (start) and one equals
            ``END``.

    Returns:
        bool: True if an unbroken chain of valid moves links the start cell to
        the last mentioned end cell, otherwise False (including when the end
        cell never appears in ``response``).
    """
    # Find all coordinates that appear in the response.
    pattern = r'\(\s*(-?\d+)\s*,\s*(-?\d+)\s*\)'
    coordinates = [(int(x), int(y)) for x, y in re.findall(pattern, response)]

    # As responses will usually talk about the solution before presenting
    # the final form, we will start from the last provided end point
    # of the maze and work backwards until we arrive at the solution.
    start = tuple(np.argwhere(maze == POS)[0])
    end = tuple(np.argwhere(maze == END)[0])

    try:
        i = find_last_index(coordinates, end)
    except ValueError:
        return False

    while True:
        curr_pos = coordinates[i]
        if curr_pos == start:
            return True
        # The first coordinate must be compared with the start as well;
        # stopping the loop before index 0 rejected responses that consist
        # of nothing but the path itself.
        if i == 0:
            return False
        prev_pos = coordinates[i - 1]
        if prev_pos not in get_valid_moves(maze, curr_pos):
            return False
        i -= 1

def find_last_index(lst, element):
    """Return the index of the last occurrence of ``element`` in ``lst``.

    Raises:
        ValueError: If ``element`` does not occur in ``lst``.
    """
    mirrored = lst[::-1]
    # Position in the reversed copy counts from the end of the original.
    offset_from_end = mirrored.index(element)
    return len(lst) - offset_from_end - 1

def get_valid_moves(maze, pos):
    """List the cells reachable from ``pos`` in a single step.

    A step goes to any of the eight surrounding cells (orthogonal or
    diagonal). A neighbour is kept when it lies inside the maze and its value
    is not ``WALL``.

    Args:
        maze: 2-D grid supporting ``len(maze)``, ``len(maze[0])`` and
            ``maze[row, col]`` indexing.
        pos: ``(row, col)`` pair of the current cell.

    Returns:
        list: ``(row, col)`` tuples, ordered row by row from the upper-left
        neighbour to the lower-right one.
    """
    row, col = pos
    n_rows, n_cols = len(maze), len(maze[0])

    reachable = []
    for d_row in (-1, 0, 1):
        for d_col in (-1, 0, 1):
            # Staying in place is not a move.
            if d_row == 0 and d_col == 0:
                continue
            r, c = row + d_row, col + d_col
            # Discard neighbours that fall outside the grid.
            if not (0 <= r < n_rows and 0 <= c < n_cols):
                continue
            if maze[r, c] != WALL:
                reachable.append((r, c))

    return reachable

def _parse_coordinate_list(text, label):
    """Return the coordinate tuples listed after ``<label>: `` in ``text``, or [] if none."""
    section = re.search(label + r": ([\d, ()]+)", text)
    if section is None:
        return []
    pairs = re.findall(r"\((\d+, \d+)\)", section.group(1))
    return [tuple(map(int, pair.split(', '))) for pair in pairs]


def _parse_single_coordinate(text, label):
    """Return the single coordinate tuple given after ``<label>: `` in ``text``."""
    matches = re.findall(label + r": \((\d+, \d+)\)", text)
    # Indexing keeps the IndexError raised when the entry is missing.
    return tuple(map(int, matches[0].split(', ')))


def parse_coordinates(text):
    """Extract the wall, empty, start and end coordinates from a maze description.

    The text is expected to contain entries of the form
    ``Walls: (a, b), (c, d)``, ``Empty: (a, b), ...``, ``Start: (a, b)`` and
    ``End: (a, b)``, where every pair is written as two non-negative integers
    separated by a comma and one space.

    Args:
        text: The maze description.

    Returns:
        tuple: ``(walls, empty, start, end)`` where ``walls`` and ``empty``
        are lists of ``(int, int)`` tuples and ``start`` and ``end`` are single
        ``(int, int)`` tuples. A ``Walls`` or ``Empty`` entry that is absent
        or lists no coordinates yields an empty list.

    Raises:
        IndexError: If the ``Start`` or ``End`` entry is missing.
    """
    walls = _parse_coordinate_list(text, "Walls")
    empty = _parse_coordinate_list(text, "Empty")
    start = _parse_single_coordinate(text, "Start")
    end = _parse_single_coordinate(text, "End")

    return walls, empty, start, end

def parse_coordinate_maze(text, size):
    """Rebuild a maze array from its coordinate-list description.

    Args:
        text: Maze description understood by ``parse_coordinates``.
        size: Shape passed to ``np.full`` for the resulting array.

    Returns:
        numpy.ndarray: Array of shape ``size`` initialised to -1, with wall
        cells set to ``WALL``, empty cells to ``PATH``, the start cell to
        ``POS`` and the end cell to ``END``.
    """
    wall_cells, empty_cells, start_cell, end_cell = parse_coordinates(text)

    # Cells mentioned in none of the lists keep the -1 filler value.
    grid = np.full(size, -1)

    for row, col in wall_cells:
        grid[row, col] = WALL
    for row, col in empty_cells:
        grid[row, col] = PATH

    # Start and end are written last so they override any earlier marking.
    start_row, start_col = start_cell[0], start_cell[1]
    grid[start_row, start_col] = POS
    end_row, end_col = end_cell[0], end_cell[1]
    grid[end_row, end_col] = END

    return grid

def _parse_size_dir_name(dir_name):
    """Return the first two integers found in a size directory name such as ``5x5``."""
    dims = re.findall(r"\d+", dir_name)
    if len(dims) < 2:
        raise ValueError(f"Cannot parse maze size from directory name {dir_name!r}")
    return int(dims[0]), int(dims[1])


def _iter_response_files(size_dir):
    """Yield ``(encoding_name, shape_name, response_file)`` for every file under ``size_dir``."""
    for encoding_dir in size_dir.iterdir():
        if not encoding_dir.is_dir():
            continue
        for shape_dir in encoding_dir.iterdir():
            if not shape_dir.is_dir():
                continue
            for response_file in shape_dir.iterdir():
                if response_file.is_file():
                    yield encoding_dir.name, shape_dir.name, response_file


def _bump(counter, key, amount=1):
    """Add ``amount`` to ``counter[key]``, creating the entry when it is missing."""
    counter[key] = counter.get(key, 0) + amount


def grade_prompts(version):
    """Grade every stored response of a results version and write summaries.

    Responses are read from
    ``results/<version>/<model>/<size>/<encoding>/<shape>/<response file>``.
    For each response, the coordinate-encoded prompt with the same file name
    is loaded from ``prompts/v1/diag/<size>/coordinate/<shape>/``, turned back
    into a maze, and the response is checked with ``is_correct_solution``.

    For each model directory the function writes ``grade_info.txt`` (one line
    per response followed by a summary) and ``grade_info.csv`` (the summary
    only), and prints the overall score and the CSV location.

    Entries that are not directories at the model, size, encoding or shape
    level are skipped, as are non-file entries at the response level.

    Args:
        version: Name of the sub-directory of ``results/`` to grade.

    Raises:
        ValueError: If a size directory name does not contain two integers.
    """
    # Kept as a function-local import, but executed once instead of once per model.
    import csv

    parent_dir = Path(f"results/{version}/")
    for model in parent_dir.iterdir():
        # Stray files next to the model directories must not abort the run.
        if not model.is_dir():
            continue

        # grade_info.txt / grade_info.csv from earlier runs live beside the
        # size directories, so only directories are treated as sizes.
        size_dirs = [entry for entry in model.iterdir() if entry.is_dir()]

        report_lines = []
        total = 0
        total_correct = 0
        total_size = {size_dir.name: 0 for size_dir in size_dirs}
        total_size_correct = {size_dir.name: 0 for size_dir in size_dirs}
        total_encoding = {"standard": 0, "unusual": 0, "coordinate": 0}
        total_encoding_correct = {"standard": 0, "unusual": 0, "coordinate": 0}
        total_shape = {shape: 0 for shape in SHAPES}
        total_shape_correct = {shape: 0 for shape in SHAPES}

        for size_dir in size_dirs:
            # Parse whole numbers so that sizes of 10 or more are supported.
            size = _parse_size_dir_name(size_dir.name)
            for encoding_name, shape_name, response_file in _iter_response_files(size_dir):
                response_text = response_file.read_text()
                # Get coordinate version of maze given in prompt so we can decode.
                coord_prompt_text = Path(f"prompts/v1/diag/{size_dir.name}/coordinate/{shape_name}/{response_file.name}").read_text()
                maze = parse_coordinate_maze(coord_prompt_text, size)
                is_correct = is_correct_solution(response_text, maze)

                report_lines.append(f"{size_dir.name}-{encoding_name}: {response_file.name}: {is_correct}\n")

                total += 1
                total_correct += is_correct
                # _bump tolerates encoding/shape names that were not pre-seeded.
                _bump(total_size, size_dir.name)
                _bump(total_size_correct, size_dir.name, is_correct)
                _bump(total_encoding, encoding_name)
                _bump(total_encoding_correct, encoding_name, is_correct)
                _bump(total_shape, shape_name)
                _bump(total_shape_correct, shape_name, is_correct)

        breakdowns = (
            ("SIZES", total_size_correct, total_size),
            ("ENCODING", total_encoding_correct, total_encoding),
            ("SHAPE", total_shape_correct, total_shape),
        )

        report_lines.append("\n\n### SUMMARY ###\n")
        report_lines.append(f"Total: {total_correct}/{total}\n\n")
        report_lines.append("Following show total correct for one variable across all others:\n")
        for heading, correct_by_key, count_by_key in breakdowns:
            report_lines.append(f"# {heading} #\n")
            for key, correct in correct_by_key.items():
                report_lines.append(f"{key}: {correct}/{count_by_key[key]}\n")

        (model / "grade_info.txt").write_text("".join(report_lines))

        print(f"{model.name} - total: {total_correct}/{total}")

        # Define the path to the CSV file
        csv_path = model / "grade_info.csv"

        # Prepare the data for the CSV
        csv_data = [
            [model.name, "Total Correct", "Total"],
            ["Summary", total_correct, total],
        ]
        for heading, correct_by_key, count_by_key in breakdowns:
            csv_data.append([heading, "Correct", "Total"])
            for key, correct in correct_by_key.items():
                csv_data.append([key, correct, count_by_key[key]])

        # Write the csv_data to the CSV file
        with open(csv_path, mode='w', newline='') as file:
            writer = csv.writer(file)
            writer.writerows(csv_data)
        print(f"CSV file saved at {csv_path}")

# Script entry point: grade the responses stored under results/only_one_per_folder/.
if __name__ == "__main__":
    grade_prompts("only_one_per_folder")