Initial commit

2022-10-11 00:02:25 +02:00
commit 7e7f04f125
2 changed files with 553 additions and 0 deletions
--- a/challenge_evaluation.py
+++ b/challenge_evaluation.py
@ -0,0 +1,276 @@
 import argparse
 import zipfile
 import json
 import os
 # Costs
 CONSTANT_COST = 1
 REGISTER_COST = 1
 OP_COST = {
    "SUB": 4,
    "ADD": 4,
    "INC": 4,
    "DEC": 4,
    "MUL": 10,
    "DIV": 10,
    "MOD": 10,
    "OR": 8,
    "AND": 8,
    "XOR": 8,
    "INV": 8,
    "SL": 5,
    "SR": 5,
    "SLU": 5,
    "SRU": 5,
    "ROTL": 7,
    "ROTR": 7,
 }
 ALG_LINE_COST = 0.5
 # ansi escape codes
 ul = "\033[4m"  # underline
 end = "\033[0m"  # reset
 ylw = "\033[33m"  # yellow
 def is_empty_row(row, pedantic=False):
    # Check if signal table is non-empty
    if "signal" in row and len(row["signal"]) != 0:
        return False
    # Only check if keys are set if pedantic is true
    if not pedantic:
        return True
    # Check if "unconditional-jump", "conditional-jump" or "label" is set
    keys = ("unconditional-jump", "conditional-jump", "label")
    return not any(key in row for key in keys)
 def evaluate(filepath, verbose=False, pedantic=False):
    filename = filepath.split(os.path.sep)[-1]
    if not filepath.endswith(".zip"):
        print(
            f"{filename} :: Supplied file does not have .zip file extension. Skipping .."
        )
        return -1
    with zipfile.ZipFile(filepath, "r") as savefile:
        with savefile.open("machine.json", "r") as machinefile, savefile.open(
            "signal.json", "r"
        ) as signalfile:
            machine = json.load(machinefile)
            signal = json.load(signalfile)
    # Load lines of code (rows)
    total_rows = signal["signaltable"]["row"]
    # Remove rows without effect (used for formatting for example)
    rows = [row for row in total_rows if not is_empty_row(row, pedantic=pedantic)]
    if verbose:
        print(f"{filename} :: Total number of rows: {len(total_rows)}")
        print(f"{filename} :: Number of rows after excluding empty: {len(rows)}")
    # Check if IR or PC register was used
    pc_used = any(
        (
            signal["name"] == "PC.W" and signal["value"] == "1"
            for row in rows
            for signal in row["signal"]
        )
    )
    ir_used = any(
        (
            signal["name"] == "IR.W" and signal["value"] == "1"
            for row in rows
            for signal in row["signal"]
        )
    )
    if verbose:
        if pc_used:
            print(f"{filename} :: PC Register was used in signal table row.")
        if ir_used:
            print(f"{filename} :: IR Register was used in signal table row.")
    # Load used multiplexer constants
    try:
        mux_input_a = next(
            filter(lambda mux: mux["muxType"] == "A", machine["machine"]["muxInputs"])
        )["input"]
        mux_consts_a = [
            int(mux_input["value"])
            for mux_input in mux_input_a
            if mux_input["type"] == "constant"
        ]
    except StopIteration:
        print(
            f"{filename} :: Couldn't find input for multiplexer A. Is the file corrupted? Skipping file .."
        )
        return -1
    try:
        mux_input_b = next(
            filter(lambda mux: mux["muxType"] == "B", machine["machine"]["muxInputs"])
        )["input"]
        mux_consts_b = [
            int(mux_input["value"])
            for mux_input in mux_input_b
            if mux_input["type"] == "constant"
        ]
    except StopIteration:
        print(
            f"{filename} :: Couldn't find input for multiplexer B. Is the file corrupted? Skipping file .."
        )
        return -1
    # Base machine has constants 0 and 1 at multiplexer A. All other constants are extensions.
    base_muxt_a = (0, 1)
    for base_input in base_muxt_a:
        try:
            mux_consts_a.remove(base_input)
        except ValueError:
            pass
    constants = set(mux_consts_a + mux_consts_b)
    if verbose:
        print(
            f"{filename} :: Found {len(mux_consts_a)} constants for multiplexer A: {mux_consts_a}"
        )
        print(
            f"{filename} :: Found {len(mux_consts_b)} constants for multiplexer B: {mux_consts_b}"
        )
        print(
            f"{filename} :: Found {len(constants)} total unique constants: [{', '.join([str(c) for c in constants])}]"
        )
    # Load used registers
    registers = machine["machine"]["registers"]["register"]
    registers = [register["name"] for register in registers]
    if pc_used:
        registers.append("PC_ALT")
    if ir_used:
        registers.append("IR_ALT")
    if verbose:
        print(f"{filename} :: Found {len(registers)} additional registers: {registers}")
    # Load used operations
    operations = machine["machine"]["alu"]["operation"]
    base_operations = ("A_ADD_B", "B_SUB_A", "TRANS_A", "TRANS_B")
    for base_op in base_operations:
        try:
            operations.remove(base_op)
        except ValueError:
            pass
    # Extract operation (remove operands)
    def get_op(op_str):
        return next(filter(lambda substr: substr not in ("A", "B"), op_str.split("_")))
    operations = list(map(get_op, operations))
    if verbose:
        print(
            f"{filename} :: Found {len(operations)} additional operations: {operations}"
        )
    # Sum points
    alg_line_costs = len(rows) * ALG_LINE_COST  # every line of code
    constant_costs = len(constants) * CONSTANT_COST  # constants at both multiplexers
    register_costs = len(registers) * REGISTER_COST  # registers
    operation_costs = 0
    for operation in operations:  # operations
        operation_costs += OP_COST[operation]
    total = alg_line_costs + constant_costs + register_costs + operation_costs
    # Summarize
    costs = (alg_line_costs, constant_costs, register_costs, operation_costs, total)
    precision = max(
        [len(str(float(cost)).split(".")[1].lstrip("0")) for cost in costs]
    )  # unreadable but works ¯\_(ツ)_/¯
    if verbose:
        print("")
    print(f"{ul}Summary for {filename}:{end}\n")
    print(f"   {alg_line_costs:5.{min(precision, 2)}f} LINES (excluding empty lines)")
    print(f"+  {constant_costs:5.{min(precision, 2)}f} CONSTANTS")
    print(f"+  {register_costs:5.{min(precision, 2)}f} REGISTERS")
    print(f"+  {operation_costs:5.{min(precision, 2)}f} OPERATIONS")
    print(f"-------------")
    print(f"=  {ylw}{total:5.{min(precision, 2)}f} TOTAL{end}\n\n")
    return total
 # Evaluation
 if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "source",
        type=str,
        nargs="+",
        help="Either ZIP file(s) generated by simulator or the submission root folder",
    )
    parser.add_argument(
        "-v",
        "--verbose",
        dest="verbose",
        action="store_true",
        help="Prints additional information.",
    )
    parser.add_argument(
        "-p",
        "--pedantic",
        dest="pedantic",
        action="store_true",
        help="Extra pedantic (for example when checking for empty lines)",
    )
    parser.add_argument(
        "-t",
        "--top",
        dest="top",
        type=int,
        help="Print top n candidates (defaults to 7)",
    )
    args = parser.parse_args()
    verbose = args.verbose
    pedantic = args.pedantic
    top_n = args.top if args.top != None else 7
    # output score for each file
    scores = []
    # check if source argument is folder
    savefiles = []
    for source in args.source:
        if os.path.isdir(source):
            # add all zip from subdirectories
            for d in [
                e for e in os.listdir(source) if os.path.isdir(os.path.join(source, e))
            ]:
                savefiles.append(os.path.join(source, d, f"{d}.zip"))
        elif source.endswith(".zip"):
            savefiles.append(source)
        else:
            print(f"Source '{source}' is not a ZIP file.")
    for savefile in savefiles:
        score = evaluate(savefile, verbose=verbose, pedantic=pedantic)
        if score == -1:
            continue
        scores.append([savefile, score])
    # if there is more than one file, output top 3
    scores.sort(key=lambda x: x[1])
    n = len(savefiles)
    if n > 1:
        print(f"{ul}Leaderboard:{end}")
        for i in range(min(n, top_n)):
            file, score = scores[i]
            print(f"#{i + 1} - {ylw}{score:5.2f} TOTAL{end} - {file}")
--- a/machine_evaluation.py
+++ b/machine_evaluation.py
@ -0,0 +1,277 @@
 import argparse
 import json
 import math
 import sys
 import os
 import subprocess
 from zipfile import ZipFile
 """
    Checks if all submission output the correct decrypted data.
    Directory structure should be as follows:
    submissions
    ├── <team1>
    |   ├── mem_layout.json [optional]
    |   └── <savename>.zip
    ├── <team2>
    |   ├── mem_layout.json [optional]
    |   └── <savename>.zip
    ...
    group
    ├── sBox
    ├── key
    ├── data_encrypted
    └── data_decrypted
    mem_layout.json must contain the keys 'sbox', 'key' and 'data', with the respective addresses as values.
    If the file does not exist, the user will be prompted to enter these addresses. The data
    will then be saved as 'mem_layout.json', to be used in subsequent calls.
    If more than one simulator ZIP file is present, the user will also be prompted to choose.
 """
 SIMULATOR_PATH = "./minimax_simulator-2.0.0-cli.jar"
 # helper strings
 OK = "\033[32mOK\033[0m"
 ERROR = "\033[31mERROR\033[0m"
 def compare_result(actual_file: str, expected_file: str) -> bool:
    """
    Compares the file at path 'actual_file' with the file at path 'expected_file' bytewise.
    If the actual file is larger than the expected file, additional bytes will be ignored.
    """
    with open(actual_file, "rb") as actual, open(expected_file, "rb") as expected:
        actual_bytes = actual.read()
        expected_bytes = expected.read()
    return actual_bytes[: len(expected_bytes)] == expected_bytes
 def create_mem_layout() -> dict:
    """
    Prompts the user to enter addresses for the sbox, key and data.
    Returns a dictionary with these three keys.
    """
    mem_layout = dict()
    for key in ("sbox", "key", "data"):
        while True:
            try:
                value = input(f"{key} address (prefix hex numbers with '0x'):   ")
                base = 16 if value.startswith("0x") else 10
                value = int(value, base=base)
                break
            except ValueError:
                print("Adress is not an integer.")
            except KeyboardInterrupt:
                sys.exit("Aborted.")
        mem_layout[key] = value
    return mem_layout
 def is_valid_zip(file: str) -> bool:
    """
    Checks if a zip file is a save file from the minimax simulator, e.g. if the contents
    are a 'machine.json' and 'signal.json' file.
    """
    if not file.endswith(".zip"):
        return False
    with ZipFile(file) as machine_zip:
        zip_content = machine_zip.namelist()
    return set(zip_content) == set(("machine.json", "signal.json"))
 def select_zip(zips: list) -> str:
    """
    Prompts the user to select a single zip file from a list, and returns it.
    """
    print("Multiple zip files found. Please select one:")
    for index, f in enumerate(zips, start=1):
        print(f"[{index}] {f}")
    while True:
        try:
            selection = input("Enter the number of the zip file to select:    ")
            selection = int(selection) - 1
            if selection <= 0 or selection > len(zips):
                print(f"Please select a number between 1 and {len(zips)}.")
            else:
                return zips[selection]
        except ValueError:
            print("Please enter a valid integer.")
        except KeyboardInterrupt:
            sys.exit("Aborted")
 def evaluate(
    zip_file: str,
    sbox_file: str,
    key_file: str,
    data_file: str,
    result_file: str,
    mem_layout: dict,
    simulator: str,
 ) -> None:
    """
    Runs the minimax simulator on the given input. The resulting file is saved in 'result_file'.
    """
    args = [
        "java",
        "-jar",
        simulator,
        zip_file,
        "--import-file",
        sbox_file,
        "--import-from",
        mem_layout["sbox"],
        "--import-file",
        key_file,
        "--import-from",
        mem_layout["key"],
        "--import-file",
        data_file,
        "--import-from",
        mem_layout["data"],
        "--export-file",
        result_file,
        "--export-from",
        mem_layout["data"],
        "--export-to",
        mem_layout["data"] + math.ceil(os.path.getsize(data_file)),
    ]
    args = [
        str(arg) for arg in args
    ]  # subprocess.run requires all arguments to be strings
    print(f"Running simulator, storing result in '{result_file}'")
    result = subprocess.run(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    print("\033[38;5;245m")
    print(result.stdout.decode("utf-8"))
    print("\033[38;5;124")
    print(result.stderr.decode("utf-8"))
    print("\033[0m")
 if __name__ == "__main__":  # only run if executed as script
    parser = argparse.ArgumentParser()
    parser.add_argument("submissions", type=str, help="Submissions root directory")
    parser.add_argument(
        "group", type=str, help="Group directory, contains all project files"
    )
    parser.add_argument(
        "-e",
        "--file-extension",
        dest="file_ext",
        type=str,
        help="Result file extension",
    )
    parser.add_argument("-j", "--jar", dest="jar", type=str, help="Simulator jar file")
    args = parser.parse_args()
    # Load teams
    teams = [
        e
        for e in os.listdir(args.submissions)
        if os.path.isdir(os.path.join(args.submissions, e))
    ]
    print(f"The following teams were found:")
    for team in teams:
        print(f"* {team}")
    # Check directory structure
    for file in ("sBox", "key", "data_encrypted", "data_decrypted"):
        if not os.path.exists(os.path.join(args.group, file)):
            sys.exit(f"Group project file '{file}' is missing.")
    # Check file extension
    if args.file_ext is None:
        args.file_ext = ""
    elif not args.file_ext.startswith("."):
        args.file_ext = f".{args.file_ext}"
    # Update simulator path if given
    simulator = SIMULATOR_PATH if args.jar is None else args.jar
    # Store evaluation results
    expected_file = os.path.join(args.group, "data_decrypted")
    results = []
    # Evaluate each team
    for team in teams:
        # load memory layout file if available (otherwise create and store it)
        try:
            with open(
                os.path.join(args.submissions, team, "mem_layout.json"), "r"
            ) as mem_layout_file:
                mem_layout = json.load(mem_layout_file)
        except FileNotFoundError:
            mem_layout = create_mem_layout()
            with open(
                os.path.join(args.submissions, team, "mem_layout.json"), "w"
            ) as mem_layout_file:
                json.dump(mem_layout, mem_layout_file)
        # Select project file (if more there is more than one zip file)
        zip_files = [
            os.path.join(args.submissions, team, f)
            for f in os.listdir(os.path.join(args.submissions, team))
            if is_valid_zip(os.path.join(args.submissions, team, f))
        ]
        zip_file = zip_files[0] if len(zip_files) == 1 else select_zip(zip_files)
        # check memory layout and convert hexadecimal addresses
        for key in ("sbox", "key", "data"):
            if key not in mem_layout:
                sys.exit(f"memory_layout does not contain key '{key}'")
            try:
                addr = int(mem_layout[key])
            except ValueError:
                try:
                    addr = int(mem_layout[key], base=16)
                except ValueError:
                    sys.exit(f"Invalid address '{mem_layout[key]}' for key '{key}'")
            mem_layout[key] = addr
        # evaluate team
        sbox_file = os.path.join(args.group, "sBox")
        key_file = os.path.join(args.group, "key")
        data_file = os.path.join(args.group, "data_encrypted")
        result_file = os.path.join(
            args.submissions, team, f"data_decrypted{args.file_ext}"
        )
        evaluate(
            zip_file,
            sbox_file,
            key_file,
            data_file,
            result_file,
            mem_layout,
            simulator=simulator,
        )
        # Compare against expected result
        results.append(compare_result(result_file, expected_file))
    # Print result summary
    print("Summary:")
    for team, result in zip(teams, results):
        if result is True:
            print(f"[{OK}]    - {team}")
        else:
            print(f"[{ERROR}] - {team}")
    print()