core.py

import math
import time
import sys
import numpy as np
from collections import namedtuple, defaultdict
from queue import PriorityQueue
import pickle

# import minihack
import nle.nethack as nh

np.set_printoptions(threshold=sys.maxsize)


class Saver:
    def __init__(self, obs_keys, filename):
        self.trajectory = defaultdict(list)
        self.filename = filename
        self.obs_keys = obs_keys

    def save_obs_and_action(self, observation, action):
        for k in self.obs_keys:
            self.trajectory[k].append(observation[k])
        self.trajectory['actions'].append(action)

    def save_to_file(self):
        with open(self.filename+'.pkl', 'wb') as fp:
            pickle.dump(self.trajectory, fp)

        print(f'Trajectory saved to {self.filename}')


Inventory = namedtuple('Inventory', 'letters classes glyphs descs')
BLStats = namedtuple('BLStats', 'x y strength_percentage strength dexterity constitution intelligence wisdom charisma score hitpoints max_hitpoints depth gold energy max_energy armor_class monster_level experience_level experience_points time hunger_state carrying_capacity dungeon_number level_number prop_mask align')

class GameWhisperer:

    def __init__(self, env, fast_mode, saver, filename):
        try:
            from game_items.item_manager_sk import Item_manager_sk
            self.item_manager = Item_manager_sk('game_items/objects.pl')
        except Exception:
            print("pyswip or prolog is not present, in-game item management is disabled")
        self.env = env
        self.a_yx = [-1, -1]
        self.walkable_glyphs = [(x, -1) for x in b'!"$%()*./<=>?[\\]`u'] + \
            [(x, 7) for x in b'#df'] + \
            [(x, 15) for x in b'#@df'] + \
            [(x, 3) for x in b'-|']
        self.size_y = 21
        self.size_x = 79
        self.current_obs = self.env.reset()
        self.glyph_obs = self.current_obs['glyphs']
        self.char_obs = self.current_obs['chars']
        self.color_obs = self.current_obs['colors']
        self.message = self.current_obs['message']
        self.update_inv()
        self.parsed_message = self.parse_message()
        if 'tty_chars' in self.current_obs.keys():
            self.all_obs = self.current_obs['tty_chars']
        self.bl_stats = BLStats(*self.current_obs['blstats'])
        self.memory = [[-1 for _ in range(self.size_x)] for _ in range(self.size_y)]
        self.exception = []
        self.search_map = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]
        self.risk_map = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]
        self.last_risk_update = 0
        self.act_num = 0
        self.score = 0
        self.total_score = 0
        self.cooldown = 100000
        self.default_search_max = 10
        self.default_hard_search_max = 10
        self.search_max = self.default_search_max
        self.hard_search_max = self.default_hard_search_max
        self.agent_id = -1
        self.update_agent()
        self.agent_id = self.glyph_obs[self.a_yx[0]][self.a_yx[1]]
        self.memory[self.a_yx[0]][self.a_yx[1]] = self.act_num
        self.safe_play = False
        self.strict_safe_play = False  # when the strategy provides for strict safety
        self.recently_ejected = False
        self.last_monster_searched = (-1, -1, 0)
        self.monster_exception = []
        self.engraved_tiles = []
        self.inedible = []
        self.recently_killed = []
        self.shop_tiles = []
        self.last_pray = -1
        self.old_turn = 0
        self.new_turn = 0
        self.panic = False
        self.pet_alive = False
        self.pet_alive_turn = 0
        self.ran = False
        self.ran_turn = 0
        self.ran_cooldown = 2
        self.guard_encounter = 0
        self.u_stairs_locations = []
        self.d_stairs_locations = []
        self.tactical_descent = 0
        self.fast_mode = fast_mode
        self.stuck_counter = 0
        self.hard_search_num = 0
        self.elbereth_violated = 0
        self.depth_turns = {}
        self.saver = saver
        # if not self.fast_mode:
        # env.render()

    def calculate_risk(self, y, x):
        """
            function that calculates the risk value of a set of tiles
            given the location of a hazard.

            +1 +1 +1 +1 +1
            +1 +2 +2 +2 +1
            +1 +2 +3 +2 +1  hazard on the center
            +1 +2 +2 +2 +1
            +1 +1 +1 +1 +1

            :param y: dangerous tile y/vertical value
            :param x: dangerous tile x/horizontal value
        """

        touched = []
        layer = self.neighbors_8_dir(y, x)
        self.risk_map[y][x] += 2
        for tile in layer:
            self.risk_map[tile[0]][tile[1]] += 2
            touched.append((tile[0], tile[1]))

        for tile in layer:
            second_layer = self.neighbors_8_dir(tile[0], tile[1])
            for s_tile in second_layer:
                if not touched.__contains__((s_tile[0], s_tile[1])):
                    self.risk_map[s_tile[0]][s_tile[1]] += 1
                    touched.append((s_tile[0], s_tile[1]))

    def update_riskmap(self):
        """
            function that calculates the risk value of every tile
        """

        self.risk_map = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]

        for y in range(self.size_y):
            for x in range(self.size_x):
                if self.is_a_monster(y, x):
                    self.calculate_risk(y, x)

    def update_inv(self):
        self.inv_obs = Inventory(
                self.current_obs['inv_letters'],
                self.current_obs['inv_oclasses'],
                self.current_obs['inv_glyphs'],
                self.current_obs['inv_strs'])

    def update_obs(self):
        """
            function that update every possible version of the observation space
        """

        self.glyph_obs = self.current_obs['glyphs']
        self.char_obs = self.current_obs['chars']
        self.color_obs = self.current_obs['colors']
        self.message = self.current_obs['message']
        self.update_inv()
        self.parsed_message = self.parse_message()
        self.bl_stats = BLStats(*self.current_obs['blstats'])
        if 'tty_chars' in self.current_obs.keys():
            self.all_obs = self.current_obs['tty_chars']
        if self.last_risk_update != self.bl_stats.time:
            self.update_riskmap()
            self.last_risk_update = self.bl_stats.time

    def crop_printer(self, obs):
        """
            debug function that print a cropped (on the agent)
            version of a given observation space

            :param obs: given observation space
        """

        for i in range(-2, 3):
            print("   ".join(str(obs[self.a_yx[0] + i][self.a_yx[1] + j]) for j in range(-2,3)))

    def debug_crop(self):
        """
            debug function that print a cropped (on the agent)
            version of every observation space
        """

        self.crop_printer(self.char_obs)
        self.crop_printer(self.color_obs)
        self.crop_printer(self.glyph_obs)
        print(self.exception)

    def glyph_cooldown(self, glyph):
        """
            function that calculates the cooldown for taking
            into account a given glyph

            :param glyph: given glyph
        """

        if self.recently_ejected:
            self.recently_ejected = False
            return -1
        char = glyph[0]
        color = glyph[1]
        cooldown = self.cooldown
        if char == 64 and color == 15:
            cooldown = -1
        elif char == 43 and color == 3:
            cooldown = 50
        elif char == 45 or char == 124 and color == 3:
            cooldown = 200
        elif char == 62 or char == 36 or char == 60:
            cooldown = 15
        elif char == 37:
            cooldown = 1
        elif [58, 59, 38, 44].__contains__(char) or 65 <= char <= 90 or 97 <= char <= 122:
            cooldown = 5
        return cooldown

    def find(self, condition, args):
        """
            function for searching the closest tile which satisfies a given condition
            starting from the agent position

            :param condition: condition function to consider
            :param args: arguments for the given condition
        """

        frontier = list()
        looked_mat = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]
        current = (self.a_yx[0], self.a_yx[1])
        found = False

        while current is not None and not found:
            looked_mat[current[0]][current[1]] = 1

            if condition(current, args):
                return True, current[0], current[1]

            nbh = self.neighbors_8_dir(current[0], current[1])

            for next_tile in nbh:
                if looked_mat[next_tile[0]][next_tile[1]] == 0 and not frontier.__contains__(next_tile):
                    frontier.append(next_tile)
            if len(frontier) > 0:
                current = frontier.pop(0)
            else:
                current = None

        return False, -1, -1

    def find_far(self, condition):
        """
            function for searching the farest tile which satisfies a given condition

            :param condition: condition function to consider
        """

        frontier = list()
        looked_mat = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]
        current = (self.a_yx[0], self.a_yx[1])

        best = None

        while current is not None:
            looked_mat[current[0]][current[1]] = 1

            if condition(current[0], current[1]):
                best = current

            nbh = self.neighbors_8_dir(current[0], current[1])

            for next_tile in nbh:
                if looked_mat[next_tile[0]][next_tile[1]] == 0 and next_tile not in frontier:
                    frontier.append(next_tile)
            if len(frontier) > 0:
                current = frontier.pop(0)
            else:
                current = None

        if best is not None:
            return True, best[0], best[1]
        else:
            return False, -1, -1

    def condition_agent_obj(self, tile, args):
        """
            condition function for searching the agent on the map

            :param tile: tile to verify
            :param args: arguments for the given condition
            :return TRUE -> if condition is verified, FALSE -> elsewise
        """

        if args.__contains__((self.char_obs[tile[0]][tile[1]], self.color_obs[tile[0]][tile[1]])) and \
                (self.memory[tile[0]][tile[1]] == -1 or
                 abs(self.memory[tile[0]][tile[1]] - self.act_num) > self.glyph_cooldown(
                            (self.char_obs[tile[0]][tile[1]], self.color_obs[tile[0]][tile[1]]))) \
                and (self.agent_id == self.glyph_obs[tile[0]][tile[1]] or self.agent_id == -1):
            return True
        else:
            return False

    def update_agent(self):
        """
            function for updating the known agent's position
        """

        found_agent, self.a_yx[0], self.a_yx[1] = self.find(self.condition_agent_obj, [(64, 15)])
        return found_agent

    def hard_search(self):
        """
            function to set the "hard search", iteratively decreasing
            the number of total searches allowed per tile, after resetting the searchmap
        """

        self.search_map = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]
        self.search_max = self.hard_search_max
        self.hard_search_max -= 1

    def reset_memory(self):
        """
            function that resets the agent's knowledge of the game world
        """

        self.exception = []
        self.monster_exception = []
        self.search_max = self.default_search_max
        self.hard_search_max = self.default_hard_search_max
        self.memory = [[-1 for _ in range(self.size_x)] for _ in range(self.size_y)]
        self.search_map = [[0 for _ in range(self.size_x)] for _ in range(self.size_y)]

    def unexplored_walkable_around(self, y, x):
        """
            function that checks for the presence of
            never visited and walkable tiles around the agent

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if exist a near walkable and unexplored tile, FALSE -> elsewise
        """

        walkable = 0
        unex_walkable = 0
        door_flag = False
        for i in self.neighbors_8_dir(y, x):
            if self.is_doorway(i[0], i[1]):
                door_flag = True
            if self.char_obs[i[0]][i[1]] == 43 or self.char_obs[i[0]][i[1]] == 96:
                return True
            if self.is_a_monster(i[0], i[1]):
                return True
            if self.is_walkable(i[0], i[1]):
                walkable += 1
            if self.is_walkable(i[0], i[1]) and self.is_unexplored(i[0], i[1]):
                unex_walkable += 1

        if door_flag and walkable == 1 and unex_walkable == 0:
            return False
        if door_flag:
            return True
        if walkable >= 3 or unex_walkable >= 1:
            return True

        return False

    def is_unexplored(self, y, x):
        """
            function that checks if a given tile is unexplored

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is unexplored, FALSE -> elsewise
        """

        if self.memory[y][x] == -1 or abs(self.memory[y][x] - self.act_num) >= self.cooldown:
            return True
        else:
            return False

    def is_walkable(self, y, x):
        """
            function that checks if a given tile is walkable

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is walkable, FALSE -> elsewise
        """

        char = self.char_obs[y][x]
        color = self.color_obs[y][x]

        if char == 64 and (y != self.a_yx[0] or x != self.a_yx[1]):
            return False

        if self.shop_tiles.__contains__((y, x)):
            return False

        if char == 101 and not self.panic:  # spore or eye
            return False
        elif char == 70 and color != 10 and color != 5 and not self.panic and self.bl_stats.hitpoints < 15:  # Molds
            return False
        # elif char == 98 and color == 2 and not self.panic:  # Acid Blob
        #    return False

        if char == 43 and color != 3:
            return True

        if (self.walkable_glyphs.__contains__((char, color)) or self.walkable_glyphs.__contains__(
                (char, -1))) and not self.exception.__contains__((y, x)):
            if char == 64 and (self.glyph_obs[y][x] != self.agent_id or color != 15):
                return False
            return True
        else:
            return False

    def is_a_monster(self, y, x):
        """
            function that checks if a given tile is a monster

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is a monster, FALSE -> elsewise
        """

        char = self.char_obs[y][x]
        color = self.color_obs[y][x]

        if self.monster_exception.__contains__((y, x)):
            return False
        # if char == 104 and self.bl_stats.depth >= 3:
        # return False
        if char == ord('@') and color != 15:
            return True
        if char in b":;&'," or 65 <= char <= 90 or 97 <= char <= 122:
            #if self.is_pet(char, color)
            if (char in b"fd") and (
                    color == 7 or color == 15) and self.pet_alive:  # or (find and self.is_unexplored(y, x)):
                return False
            elif char == ord('u') and color == 3 and self.pet_alive:  # tamed pony is not a moster
                return False
            elif char == ord('e') and not self.panic and self.stuck_counter < 100:  # spore or eye
                return False
            elif char == ord('F') and color != 10 and color != 5 and not self.panic and self.bl_stats.hitpoints < 15:  # Molds
                return False
            # elif char == 98 and color == 2 and not self.panic:  # Acid Blob
            #    return False
            else:
                return True
        else:
            return False

    def is_passive_monster(self, y, x):
        """
            function that checks if a given tile is a passive monster

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is a monster, FALSE -> elsewise
        """

        char = self.char_obs[y][x]
        color = self.color_obs[y][x]

        if char in b"bcePRF@":
            return True
        else:
            return False

    def is_safe(self, y, x):
        """
            function that checks if a given tile is safe (with zero risk)

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is safe, FALSE -> elsewise
        """

        if self.risk_map[y][x] > 0:
            return False
        else:
            return True

    def is_unsearched_wallside(self, y, x):
        """
            function that checks if a given tile is near a wall
            and the agent never performed a search action there

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is unsearched and wallside, FALSE -> elsewise
        """

        for (nhb_y, nhb_x) in self.neighbors_4_dir(y, x):
            if (self.char_obs[nhb_y][nhb_x] == 124 or self.char_obs[nhb_y][nhb_x] == 45) and \
                    self.color_obs[nhb_y][nhb_x] == 7 and self.search_map[nhb_y][nhb_x] == 0:
                return True
        return False

    def is_unsearched_voidside(self, y, x):
        """
            function that checks if a given tile is near a black unknown tile
            and the agent never performed a search action there

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is unsearched and near an unknown tile, FALSE -> elsewise
        """

        for (nhb_y, nhb_x) in self.neighbors_4_dir(y, x):
            if self.char_obs[nhb_y][nhb_x] == 32 and self.search_map[nhb_y][nhb_x] == 0:
                return True
        return False

    def is_doorway(self, y, x):
        """
            function that checks if a given tile is a doorway looking for the glyph and also
            counting the walls around the tile

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is a doorway, FALSE -> elsewise
        """

        char = self.char_obs[y][x]
        color = self.color_obs[y][x]
        if char in b'+|-' and color == 3:  # or (char == 46 and self.is_unexplored(y, x)): wip
            return True
        walls_count_h = 0
        walls_count_v = 0
        for (nhb_y, nhb_x) in self.neighbors_4_dir(y,x):
            if self.char_obs[nhb_y][nhb_x] in b"|-" and self.color_obs[nhb_y][nhb_x] == 7:
                if nhb_x == x:  # if vertically adjacent
                    walls_count_v += 1
                else:
                    walls_count_h += 1

        if walls_count_h == 2 or walls_count_v == 2:
            return True
        else:
            return False

    def is_isolated(self, y, x, glyph, cross):
        """
            function that checks if a given tile is isolated from
            other tiles of the same kind (or also near a doorway)

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: TRUE -> if given tile is isolated, FALSE -> elsewise
        """

        same_glyph_count = 0
        near = self.neighbors_8_dir(y, x)
        while len(near) > 0:
            next_tile = near.pop()
            if cross and next_tile[0] != y and next_tile[1] != x:
                continue
            if glyph is None:
                if self.glyph_obs[next_tile[0]][next_tile[1]] == self.glyph_obs[y][x] or self.is_doorway(next_tile[0], next_tile[1]):
                    same_glyph_count += 1
            else:
                char = glyph[0]
                color = glyph[1]
                if (self.char_obs[next_tile[0]][next_tile[1]] == char and self.color_obs[next_tile[0]][
                        next_tile[1]] == color) or self.is_doorway(next_tile[0], next_tile[1]):
                    same_glyph_count += 1
        if same_glyph_count < 2:
            return True
        else:
            return False

    def is_near_glyph(self, y, x, glyph, dir_num):
        """
            function that checks if a given tile is near
            a tile carrying a specific glyph

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :param glyph: specific glyph to be noticed
            :param dir_num: 4 or 8 directions to check
            :return: TRUE -> if given tile is near the given glyph, FALSE -> elsewise
        """

        char = glyph[0]
        color = glyph[1]
        around_it = []
        if dir_num == 8:
            around_it = self.neighbors_8_dir(y, x)
        if dir_num == 4:
            around_it = self.neighbors_4_dir(y, x)
        while len(around_it) > 0:
            near = around_it.pop()
            if self.char_obs[near[0]][near[1]] == char and (self.color_obs[near[0]][near[1]] == color or color == -1):
                return True
        return False

    def neighbors_8_dir(self, y, x):
        """
            function that return the 8-directions neighborhood of a given tile

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: a list containing the 8 tiles around the given one
        """

        neighborhood = self.neighbors_4_dir(y, x)

        if y > 0:
            if x > 0:
                neighborhood.append((y - 1, x - 1))  # nw
            if x < self.size_x - 1:
                neighborhood.append((y - 1, x + 1))  # ne
        if x < self.size_x - 1:
            if y < self.size_y - 1:
                neighborhood.append((y + 1, x + 1))  # se
        if y < self.size_y - 1:
            if x > 0:
                neighborhood.append((y + 1, x - 1))  # sw

        return neighborhood

    def neighbors_4_dir(self, y, x):
        """
            function that return the 4-directions (N,E,S,W) neighborhood of a given tile

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :return: a list containing the 4 tiles around the given one
        """

        neighborhood = list()
        if y > 0:
            neighborhood.append((y - 1, x))  # n
        if x < self.size_x - 1:
            neighborhood.append((y, x + 1))  # e
        if y < self.size_y - 1:
            neighborhood.append((y + 1, x))  # s
        if x > 0:
            neighborhood.append((y, x - 1))  # w
        return neighborhood

    def neighbors(self, y, x, safe):
        """
            function that returns the list of correctly reachable tiles
            (considering walkable tiles without entering the doors diagonally)
            starting from a given tile, avoiding dangerous tiles in case the "safe" flag is active

            :param y: tile y/vertical coordinate
            :param x: tile x/horiziontal coordinate
            :param safe: flag that determines the consideration of dangerous tiles
            :return: a list containing the tiles around the given one
        """

        neighborhood = list()
        doorway = self.is_doorway(y, x)
        for (nhb_y, nhb_x) in self.neighbors_8_dir(y,x):
            if self.is_walkable(nhb_y, nhb_x) and (not safe or self.is_safe(nhb_y, nhb_x)) and \
               (nhb_x == x or nhb_y == y or not (doorway or self.is_doorway(nhb_y, nhb_x))): #not diagonally adjacent or no doors in the way
                neighborhood.append((nhb_y, nhb_x))
        return neighborhood

    def parse_message(self):
        """
            function that parse the in game message form the NLE observation

            :return: a string containing the parsed message
        """
        return bytes(self.message).decode().strip('\0')

    def parse_all(self):
        """
            function that parse the complete observation returning a readable form of it

            :return: a string containing the parsed observation state
        """

        parsed_string = ""
        for i in range(0, 24):
            for j in range(0, 80):
                c = self.all_obs[i][j]
                parsed_string = parsed_string + chr(c)
        return parsed_string

    def type_text(self, text):
        for k in text:
            self.current_obs, rew, done, info = self.env.step(nh.ACTIONS.index(ord(k)))
        return rew, done, info


    # new version, tested
    def do_it(self, action, action_iterable=None):
        """
            function for sending input to the game terminal.
            It offers the management of specific cases, automating some actions.
            :param action: action to be performed. Must be a character or an action in nle.nethack.ACTIONS
            :param action_iterable: optional iterable useful when other actions have to be performed
            :return: the "reward" value (1 if episode success, 0 elsewise),
                     the "done" value (TRUE if the episode endend, FALSE elsewise),
                     the "info" object containg extra information (Gym standard implementation)
        """

        # print(self.bl_stats)
        self.old_turn = self.bl_stats.time
        rew = 0
        done = False
        info = None

        if self.update_agent():
            self.current_obs, rew, done, info = self.env.step(38)
            self.update_obs()

            # observations.append(numpy.concatenate((game.current_obs['chars'], game.current_obs['colors']), axis=None))

        def to_action_index(action):
            if isinstance(action, str):
                assert len(action) == 1, action
                action = ord(action)
            return nh.ACTIONS.index(action)

        rew, done, info = self.single_step(to_action_index(action))
        if action_iterable:
            for a in action_iterable:
                rew, done, info = self.single_step(to_action_index(a))
        return rew, done, info

    def single_step(self, action_index):
        """
            function for sending a single input to the game terminal.
            It offers the management of specific cases, automating some actions.
            :param action_index: action to be performed. Must be the index of the action in nle.nethack.ACTION
            :return: the "reward" value (1 if episode success, 0 elsewise),
                     the "done" value (TRUE if the episode endend, FALSE elsewise),
                     the "info" object containg extra information (Gym standard implementation)
        """
        rew = 0
        done = False
        info = None
        if not self.fast_mode:
            print("pray_timeout: ", abs(self.last_pray - self.bl_stats.time))
        if self.bl_stats.time % 100 == 0:
            print("current score: ", self.bl_stats.score, " turn: ",
                  self.bl_stats.time, " time: ", time.localtime()[3], ":", time.localtime()[4], "  -")
            go_back(2)

        if abs(self.bl_stats.time - self.pet_alive_turn) > 10 and self.bl_stats.time > 2000:
            self.pet_alive = False

        if self.act_num % 50 == 0:  # modifica
            self.panic = False

        if self.ran:
            if abs(self.ran_turn - self.bl_stats.time) > self.ran_cooldown:
                self.ran = False

        if self.score < self.bl_stats.score:
            self.score = self.bl_stats.score

        if self.parsed_message.__contains__("Hello stranger, who are you?"):  # respond Croesus
            self.guard_encounter += 1
            return -1, True, None
        '''
        if self.update_agent():
            self.current_obs, rew, done, info = self.env.step(38)
        self.update_obs()
        '''

        if self.update_agent():
            self.current_obs, rew, done, info = self.env.step(action_index)
        self.update_obs()

        if "swap" in self.parsed_message:
            self.pet_alive = True
            self.pet_alive_turn = self.bl_stats.time

        if self.parsed_message.__contains__("Are you sure you want to pray?") or self.parsed_message.__contains__(
                "Really attack"):
            self.type_text("y")
        if self.parsed_message.__contains__("You are carrying too much to get through."):
            next_tile = self.inverse_move_translator(self.a_yx[0], self.a_yx[1], action_index)
            self.exception.append(next_tile)
            self.update_obs()

        if self.parsed_message.__contains__("Closed for inventory"):
            for ty, tx in self.neighbors_4_dir(self.a_yx[0], self.a_yx[1]):
                if self.char_obs[ty][tx] == ord('+') and self.color_obs[ty][tx] == 3:
                    self.shop_tiles.append((ty, tx))

        if ((self.parsed_message.__contains__("Welcome") and self.parsed_message.__contains__(
                "\"")) or self.parsed_message.__contains__("\"How dare you break my door?\"")) \
                and not 0 <= self.bl_stats.time <= 5:
            self.shop_propagation(self.a_yx)

        if self.bl_stats.max_hitpoints != 0 and (self.bl_stats.hitpoints / self.bl_stats.max_hitpoints) <= 0.5 and not self.safe_play:
            if not self.fast_mode:
                print("SAFE_MODE : enabled")
            self.safe_play = True
        elif self.bl_stats.max_hitpoints != 0 and (self.bl_stats.hitpoints / self.bl_stats.max_hitpoints) > 0.85 and self.safe_play:
            if not self.fast_mode:
                print("SAFE_MODE : disabled")
            self.safe_play = False
        self.act_num += 1
        if self.update_agent():
            self.memory[self.a_yx[0]][self.a_yx[1]] = self.act_num
            if nh.ACTIONS[action_index] == nh.Command.SEARCH:
                self.search_map[self.a_yx[0]][self.a_yx[1]] = 1
                for next_tile in self.neighbors_8_dir(self.a_yx[0], self.a_yx[1]):
                    self.search_map[next_tile[0]][next_tile[1]] = 1
        if not self.fast_mode:  # and x != 10:
            # go_back(27)
            self.env.render()
            # time.sleep(0.05)
        if self.saver:
            self.saver.save_obs_and_action(self.current_obs, action_index)

        self.new_turn = self.bl_stats.time
        self.depth_turns.setdefault(str(self.bl_stats.depth), 0)
        self.depth_turns[str(self.bl_stats.depth)] += abs(self.old_turn - self.new_turn)

        return rew, done, info

    def shop_propagation(self, tile):
        """
            function that propagates the "shop" status to the appropriate tiles starting from the given tile

            :param tile: the starting tile
            :return: //
        """

        for near in self.neighbors_8_dir(tile[0], tile[1]):
            char = self.char_obs[near[0]][near[1]]
            if char in b'|-# ' or (
                    near[0] == self.a_yx[0] and near[1] == self.a_yx[
                    1]):  # or ([58,59,38,39,44].__contains__(char) or 65 <= char <= 90 or 97 <= char <= 122) :
                continue
            elif not self.shop_tiles.__contains__(near):
                self.shop_tiles.append(near)
                self.shop_propagation(near)

    @staticmethod
    def move_translator(from_y, from_x, to_y, to_x):
        """
            function that calculates the move according to the NLE implementation
            needed to move between two given tiles

            :param from_x: x value of the starting tile
            :param from_y: y value of the starting tile
            :param to_x: x value of the destination tile
            :param to_y: y value of the destination tile
            :return: the numerical value of the action to be performed
        """

        if to_y > from_y:  # la y del next è maggiore -> movimenti verso sud
            if to_x > from_x:
                move = nh.CompassDirection.SE
            elif to_x == from_x:
                move = nh.CompassDirection.S
            else:
                move = nh.CompassDirection.SW

        elif to_y == from_y:  # la y del next è uguale -> movimenti verso est ed ovest
            if to_x > from_x:
                move = nh.CompassDirection.E  # e
            else:
                move = nh.CompassDirection.W  # w
        else:  # la y del next è minore -> movimenti verso nord
            if to_x > from_x:
                move = nh.CompassDirection.NE  # ne
            elif to_x == from_x:
                move = nh.CompassDirection.N  # n
            else:
                move = nh.CompassDirection.NW  # nw

        return move

    @staticmethod
    def inverse_move_translator(from_y, from_x, direction):
        """
            function that calculates the destination tile given
            a starting tile and a direction (according to the NLE implementation)

            :param from_x: x value of the starting tile
            :param from_y: y value of the starting tile
            :param direction: the move according to the NLE implementation
            :return: y and x value of the destination tile
        """

        if direction == nh.CompassDirection.N:
            return from_y - 1, from_x
        elif direction == nh.CompassDirection.NE:
            return from_y - 1, from_x + 1
        elif direction == nh.CompassDirection.E:
            return from_y, from_x + 1
        elif direction == nh.CompassDirection.SE:
            return from_y + 1, from_x + 1
        elif direction == nh.CompassDirection.S:
            return from_y + 1, from_x
        elif direction == nh.CompassDirection.SW:
            return from_y + 1, from_x - 1
        elif direction == nh.CompassDirection.W:
            return from_y, from_x - 1
        elif direction == nh.CompassDirection.NW:
            return from_y - 1, from_x - 1

    def reset_game(self):
        """
            function that sets variable values to their initial version,
            preparing the agent for a new game

            :return: //
        """

        self.current_obs = self.env.reset()
        self.new_turn = 0
        self.elbereth_violated = 0
        self.old_turn = 0
        self.update_obs()
        self.reset_memory()
        self.safe_play = False
        self.agent_id = -1
        self.update_agent()
        self.agent_id = self.glyph_obs[self.a_yx[0]][self.a_yx[1]]
        self.memory[self.a_yx[0]][self.a_yx[1]] = self.act_num
        if not self.fast_mode:
            self.env.render()
        self.engraved_tiles = []
        self.inedible = []
        self.shop_tiles = []
        self.u_stairs_locations = []
        self.d_stairs_locations = []
        self.tactical_descent = 0
        self.total_score += self.score
        self.score = 0
        self.recently_killed = []
        self.depth_turns = {}
        self.last_pray = -1

    def partial_reset_game(self):
        """
            function that sets some variable values to their initial version,
            resetting the agent's knowledge of the world

            :return: //
        """

        self.pet_alive = False
        self.update_obs()
        self.reset_memory()
        self.engraved_tiles = []
        self.recently_killed = []
        self.shop_tiles = []
        self.inedible = []

    def get_items_by_class(self, oc_class):
        return (i for i,c in enumerate(self.inv_obs.classes) if c == oc_class)
    
    def get_elbereth_violation(self):
        return self.elbereth_violated

    def set_elbereth_violation(self):
        self.elbereth_violated = self.act_num

    def check_exception(self, tile):
        return self.exception.__contains__((tile[0], tile[1]))

    def append_exception(self, tile):
        self.exception.append(tile)

    def check_engraved(self, tile):
        return self.engraved_tiles.__contains__((tile[0], tile[1]))

    def append_engraved(self, tile):
        self.engraved_tiles.append(tile)

    def check_monster_exception(self, tile):
        return self.monster_exception.__contains__((tile[0], tile[1]))

    def append_monster_exception(self, tile):
        self.monster_exception.append(tile)

    def check_inedible(self, tile):
        return self.inedible.__contains__((tile[0], tile[1]))

    def append_inedible(self, tile):
        self.inedible.append(tile)

    def reset_inedible(self):
        self.inedible = []

    def get_recently_killed(self):
        return self.recently_killed

    def append_recently_killed(self, data):
        self.recently_killed.append(data)

    def remove_recently_killed(self, data):
        self.recently_killed.remove(data)

    def check_recently_ejected(self):
        return self.recently_ejected

    def notify_recently_ejected(self):
        self.recently_ejected = True

    def update_memory(self, y, x):
        self.memory[y][x] = self.act_num

    def clear_memory(self, y, x):
        self.memory[y][x] = -1

    def update_last_monster_searched(self, char, color, times):
        self.last_monster_searched = (char, color, times)

    def get_last_monster_searched(self):
        return self.last_monster_searched

    def get_agent_position(self):
        return self.a_yx

    def get_tactical_descent(self):
        return self.tactical_descent

    def set_tactical_descent(self, turn):
        self.tactical_descent = turn

    def get_size_x(self):
        return self.size_x

    def get_size_y(self):
        return self.size_y

    def get_act_num(self):
        return self.act_num

    def get_memory(self, y, x):
        return self.memory[y][x]

    def get_risk(self, y, x):
        return self.risk_map[y][x]

    def force_risk(self, y, x, risk):
        self.risk_map[y][x] = risk

    def get_glyph(self, y, x):
        return self.glyph_obs[y][x]

    def get_char(self, y, x):
        return self.char_obs[y][x]

    def get_color(self, y, x):
        return self.color_obs[y][x]

    def get_parsed_message(self):
        return self.parsed_message

    def get_bl_stats(self):
        return self.bl_stats

    def get_safe_play(self):
        return self.safe_play

    def get_pet_alive(self):
        return self.pet_alive

    def get_actual_score(self):
        return self.score

    def get_total_score(self):
        return self.total_score

    def get_stairs_locations(self):
        return self.u_stairs_locations, self.d_stairs_locations

    def append_stairs_location(self, stairs, u):
        if u:
            self.u_stairs_locations.append(stairs)
        else:
            self.d_stairs_locations.append(stairs)

    def get_last_pray(self):
        return self.last_pray

    def update_last_pray(self):
        self.last_pray = self.bl_stats.time

    def update_ran(self):
        self.ran = True
        self.ran_turn = self.bl_stats.time

    def reset_ran(self):
        self.ran = False

    def get_ran(self):
        return self.ran

    def get_new_turn(self):
        return self.new_turn

    def get_old_turn(self):
        return self.old_turn

    def get_search_max(self):
        return self.search_max

    def stuck(self):
        self.stuck_counter += 1

    def reset_stuck_counter(self):
        self.stuck_counter = 0

    def get_stuck_counter(self):
        return self.stuck_counter

    def increment_hard_search_num(self):
        self.hard_search_num += 1

    def reset_hard_search_num(self):
        self.hard_search_num = 0

    def get_hard_search_num(self):
        return self.hard_search_num

    def get_fast_mode(self):
        return self.fast_mode

    def get_depth_turns(self, d):
        return self.depth_turns[str(d)]

    def do_panic(self):
        self.panic = True


class DungeonWalker:

    def __init__(self, game):
        self.game = game

    # heuristic function to compute distances in a 8-directional grid
    @staticmethod
    def h_octile_distance(ay, ax, oy, ox):
        """
            function that calculates "octile distance" heuristic for a given tile,
            given an objective tile

            :param ay: starting tile y/vertical coordinate
            :param ax: starting tile x/horiziontal coordinate
            :param oy: objective tile y/vertical coordinate
            :param ox: objective tile x/horiziontal coordinate
            :return: Octile Distance value for the given tile
        """

        x_d = abs(ax - ox)
        y_d = abs(ay - oy)
        return (1.414 * min(x_d, y_d)) + abs(x_d - y_d)

    def a_star(self, oy, ox, safe):
        """
            function implementing A* algorythm

            :param oy: objective tile y/vertical coordinate
            :param ox: objective tile x/horiziontal coordinate
            :return: came_from -> dictionary containing the associations between the tiles of the identified path
                     cost_so_far -> dictionary containing the costs for moving in each tile of the identified path
        """

        # voglio che restituisca il cammino
        # lista di priorità rappresentante la frontiera
        frontier = PriorityQueue()
        agent = self.game.get_agent_position()
        # inizializzo l'algoritmo inserendo nella lista il nodo iniziale (posizione agente) (priorità massima ->0)
        frontier.put(((agent[0], agent[1]), 0))
        # dizionario in cui associo ai nodi il predecessore
        came_from = {}
        # dizionario in cui associo ai nodi il costo f(n) accumalatovi
        cost_so_far = {}
        came_from[(agent[0], agent[1])] = None
        cost_so_far[(agent[0], agent[1])] = 0

        while not frontier.empty():
            current = frontier.get()

            if current == (oy, ox):  # goal reached
                break
            near = self.game.neighbors(current[0][0], current[0][1], safe)
            for next_tile in near:  # for adjacent cell
                new_cost = cost_so_far[current[0]] + 1
                if next_tile not in cost_so_far or new_cost < cost_so_far[next_tile]:
                    cost_so_far[next_tile] = new_cost
                    priority = new_cost + self.h_octile_distance(next_tile[0], next_tile[1], oy, ox)
                    frontier.put((next_tile, priority))
                    came_from[next_tile] = current[0]
        return came_from, cost_so_far

    def path_finder(self, oy, ox, not_reach_diag, safe_play):
        """
            function that calculates "octile distance" heuristic for a given tile,
            given an objective tile

            :param not_reach_diag: flag identifying a tile which cant be reachen diagonally
            :param safe_play: flag identifying the need for a safe play
            :param oy: objective tile y/vertical coordinate
            :param ox: objective tile x/horiziontal coordinate
            :return: the best path found according to game's rules, "A*" and "Octile Distance" heursitic
        """

        yellow_brick_road = list()

        agent = self.game.get_agent_position()
        if self.game.get_risk(agent[0], agent[1]) >= 2 and safe_play:
            return yellow_brick_road

        came_from, cost_so_far = self.a_star(oy, ox, safe_play)
        cursor = (oy, ox)
        next_tile = None
        while cursor is not None:
            if next_tile is not None:

                if not_reach_diag and next_tile[0] == oy and next_tile[1] == ox and next_tile[0] != cursor[0] and \
                        next_tile[1] != cursor[1]:
                    # next node is the goal and must not be reached diagonally
                    if next_tile[0] > cursor[0] and next_tile[1] > cursor[1]:  # y and x greater -> se
                        if self.game.is_walkable(cursor[0], cursor[1] + 1):
                            yellow_brick_road.append(nh.CompassDirection.S)  # s
                            yellow_brick_road.append(nh.CompassDirection.E)  # e
                        elif self.game.is_walkable(cursor[0] + 1, cursor[1]):
                            yellow_brick_road.append(nh.CompassDirection.E)  # e
                            yellow_brick_road.append(nh.CompassDirection.S)  # s
                    elif next_tile[0] > cursor[0] and next_tile[1] < cursor[1]:  # y greater and x smaller -> sw
                        if self.game.is_walkable(cursor[0], cursor[1] - 1):
                            yellow_brick_road.append(nh.CompassDirection.S)  # s
                            yellow_brick_road.append(nh.CompassDirection.W)  # w
                        elif self.game.is_walkable(cursor[0] + 1, cursor[1]):
                            yellow_brick_road.append(nh.CompassDirection.W)  # w
                            yellow_brick_road.append(nh.CompassDirection.S)  # s
                    elif next_tile[0] < cursor[0] and next_tile[1] < cursor[1]:  # y smaller and x greater -> nw
                        if self.game.is_walkable(cursor[0], cursor[1] - 1):
                            yellow_brick_road.append(nh.CompassDirection.N)  # n
                            yellow_brick_road.append(nh.CompassDirection.W)  # w
                        elif self.game.is_walkable(cursor[0] - 1, cursor[1]):
                            yellow_brick_road.append(nh.CompassDirection.W)  # w
                            yellow_brick_road.append(nh.CompassDirection.N)  # n
                    elif next_tile[0] < cursor[0] and next_tile[1] > cursor[1]:  # y smaller and x smaller -> ne
                        if self.game.is_walkable(cursor[0], cursor[1] + 1):
                            yellow_brick_road.append(nh.CompassDirection.N)  # n
                            yellow_brick_road.append(nh.CompassDirection.E)  # e
                        elif self.game.is_walkable(cursor[0] - 1, cursor[1]):
                            yellow_brick_road.append(nh.CompassDirection.E)  # e
                            yellow_brick_road.append(nh.CompassDirection.N)  # n

                yellow_brick_road.append(self.game.move_translator(cursor[0], cursor[1], next_tile[0], next_tile[1]))
            next_tile = cursor
            try:
                cursor = came_from[cursor]
            except:
                return None

        return yellow_brick_road


# method that plans the skill to execute in a given state
def planning(game, skills_prio, skill_map):
    """
        function that plan the best skill to perform, according to the in-game state of the agent
        and the skills priority establied by the user in agent's configuration

        :param game: reference to the core "GameWhisperer" object
        :param skills_prio: starting tile x/horiziontal coordinate
        :param skill_map: objective tile y/vertical coordinate
        :return: skill_name -> a string containing the identification name of the planned skill
                 path -> an optional path useful in planned skill's execution
                 arg1 -> an optional extra argument useful for some skill's execution
    """

    if game.get_new_turn() == game.get_old_turn():
        game.stuck()
    else:
        game.reset_stuck_counter()

    if not game.update_agent():
        return "failure", None, None
    else:
        game.update_obs()

    stats = game.get_bl_stats()
    safe_play = game.get_safe_play()
    agent = game.get_agent_position()

    while len(skills_prio) > 0:
        skill_name = skills_prio.pop(0)
        skill = skill_map[skill_name]

        out = skill.planning(stats, safe_play, agent)
        if out is not None:
            skill_name_o = out[0]
            path = out[1]
            arg1 = out[2]
            if skill_name_o is not None:
                return skill_name, path, arg1

    return "failure", None, None


# methos that executes the planned skills
def main_logic(dungeon_walker, game, skills_prio, skill_map, attempts):
    """
        function that plan the best skill to perform, according to the in-game state of the agent
        and the skills priority establied by the user in agent's configuration

        :param dungeon_walker: reference to the core "DungeonWalker" object
        :param game: reference to the core "GameWhisperer" object
        :param skills_prio: starting tile x/horiziontal coordinate
        :param skill_map: objective tile y/vertical coordinate
        :param attempts: number of games to perform according to agent's configuration
        :return: //
    """

    success = 0
    scores = []
    mediana = 0

    for i in range(0, attempts):

        if game.get_fast_mode():
            if game.get_act_num() != 0 and i != 0:
                scores.append(game.get_actual_score())
                size = len(scores)
                center = math.floor(size / 2)
                scores.sort()
                if (size % 2) == 1:
                    mediana = scores[center]
                else:
                    mediana = (scores[center] + scores[center - 1]) / 2

        done = False
        game.reset_hard_search_num()
        rew = 0
        game.reset_game()
        game.reset_stuck_counter()

        if game.get_fast_mode():
            go_back(3)
            true_divisor = i
            if true_divisor == 0:
                true_divisor = 1
            face = "(ಠ_ಠ)"
            if mediana < 475 and i != 0:
                face = "(╥︣﹏᷅╥)"
            if mediana >= 681:
                face = "(ง'-')ง"
            if mediana >= 756:
                face = "ᕙ(`▿´)ᕗ"
            print("// Mean : ", game.get_total_score() / true_divisor, "// Median: ", mediana, " // Games: ",
                  len(scores), "      ", face, "               ")
            #print(scores)

        while not done:
            skill, path, arg1 = planning(game, skills_prio.copy(), skill_map)
            if not game.get_fast_mode():
                print("SKILL: ", skill, " PATH: ", path)

            if not game.update_agent() or game.get_stuck_counter() > 200:
                break

            agent = game.get_agent_position()
            stats = game.get_bl_stats()

            if skill == "failure":
                hs_n = game.get_hard_search_num()
                if not game.update_agent() or hs_n > 200:
                    break
                elif hs_n > 20:
                    dungeon_walker.panic = True
                    game.do_panic()

                if hs_n % 2 == 0 and hs_n != 0:
                    game.reset_memory()
                game.hard_search()
                game.increment_hard_search_num()
                rew, done, info = game.do_it(nh.Command.SEARCH)  # search per aspettare con value
            else:
                rew, done, info = skill_map[skill].execution(path, arg1, agent, stats)

        if rew == 1:
            success += 1

    if game.saver: game.saver.save_to_file()

def go_back(num_lines):
    print("\033[%dA" % num_lines)