forked from GeorgePik/POMCP
-
Notifications
You must be signed in to change notification settings - Fork 0
/
auxilliary.py
99 lines (82 loc) · 3.31 KB
/
auxilliary.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
# Auxilliary code
import numpy as np
from itertools import chain, combinations
# builds a tree
class BuildTree():
def __init__(self, giveParameters = ['isRoot', {}, 0, 0, []] ): #add init dist
# index for nodes
self.count = -1
self.nodes = {}
# dictionary where key is node and value is list of corresponding values
# = [ parent, children, Nc, Value, B() (-1) if action node]
self.giveParameters = []
# Create instance attributes for initialization
# This is necessary to avoid multiple instances sharing same
# Attributes
for i in giveParameters:
if type(i) == str or type(i) == int:
self.giveParameters.append(i)
else:
self.giveParameters.append(i.copy())
self.nodes[self.count] = self.giveParameters
# Expand the tree by one node.
# If the result of an action give IsAction = True
def ExpandTreeFrom(self, parent, index, IsAction = False):
self.count += 1
if IsAction:
# add node to tree
self.nodes[self.count] = [parent, {}, 0, 0, -1]
# inform parent node
self.nodes[parent][1][index] = self.count
else:
self.nodes[self.count] = [parent, {}, 0, 0, []]
self.nodes[parent][1][index] = self.count
# Check given nodeindex corresponds to leaf node
def isLeafNode(self, n):
if self.nodes[n][2] == 0:
return True
else:
return False
# As in POMCP/ Checks that an observation was already made before moving
def getObservationNode(self,h,sample_observation):
# Check if a given observation node has been visited
if sample_observation not in list(self.nodes[h][1].keys()):
# If not create the node
self.ExpandTreeFrom(h, sample_observation)
# Get the nodes index
Next_node = self.nodes[h][1][sample_observation]
return Next_node
# Removes a node and
def prune(self, node):
children = self.nodes[node][1]
del self.nodes[node]
for _, child in children.items():
self.prune(child)
# make new root and update children
def make_new_root(self, new_root):
self.nodes[-1] = self.nodes[new_root].copy()
del self.nodes[new_root]
self.nodes[-1][0] = 'isRoot'
# update children
for _ , child in self.nodes[-1][1].items():
self.nodes[child][0] = -1
# Prune tree after action and observation were made
def prune_after_action(self, action, observation):
# Get node after action
action_node = self.nodes[-1][1][action]
# Get new root (after observation)
new_root = self.getObservationNode(action_node, observation)
# remove new_root from parent's children to avoid deletion
del self.nodes[action_node][1][observation]
# prune unnesecary nodes
self.prune(-1)
# set new_root as root (key = -1)
self.make_new_root(new_root)
#UCB score calculation
def UCB(N,n,V,c = 1): #N=Total, n= local, V = value, c = parameter
return V + c*np.sqrt(np.log(N)/n)
# from itertools recipes
# creates power set
def powerset(iterable):
s = list(iterable)
return chain.from_iterable(combinations(s, r) for r in range(len(s)+1))