forked from okreng/risk_learning
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathagent.py
More file actions
executable file
·81 lines (64 loc) · 2.45 KB
/
agent.py
File metadata and controls
executable file
·81 lines (64 loc) · 2.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
"""
This file contains the agent object for holding multiple q functions
"""
# import all existing policies
from q_funcs.allot import random_allot
from q_funcs.attack import linear_attack_net, max_success
from q_funcs.fortify import random_fortify
import sys, argparse
class Agent():
"""
This class holds three q_func objects
One for each action type
"""
def __init__(self, player_id, territories, act_list, allot_q_func, attack_q_func, fortify_q_func, verbose=True):
"""
Constructor for agent
:param territories: int number of territories on the board
:param allot_policy: string q_func to enact for allot
:param attack_policy: string q_func to enact for attack
:param fortify_policy: string q_func to enact for fortify
:return none:
"""
self.player_id = player_id
self.territories = territories
self.act_list = act_list
if allot_q_func is "random_allot":
self.allot_q_func = random_allot.RandomAllot(self.territories, self.act_list)
else:
print("No valid allot Q function specified")
exit()
if attack_q_func is "max_success":
self.attack_q_func = max_success.MaxSuccess(self.territories, self.act_list)
elif attack_q_func is "linear_attack_net":
# TODO pass in arguments to this function
self.attack_q_func = linear_attack_net.LinearAttackNet(self.territories, self.act_list, '0-56', 15)
else:
print("No valid attack Q function specified")
exit()
if fortify_q_func is "random_fortify":
self.fortify_q_func = random_fortify.RandomFortify(self.territories, self.act_list)
else:
print("No valid attack Q function specified")
exit()
if verbose:
print("Player {} successfully instantiated with Q functions:".format(player_id))
print("\tallot: {}".format(allot_q_func))
print("\tattack: {}".format(attack_q_func))
print("\tfortify: {}".format(fortify_q_func))
return
def parse_arguments():
parser = argparse.ArgumentParser(description='Agent Argument Parser')
parser.add_argument('--train',dest='train',type=bool,default=False)
parser.add_argument('--territories',dest='territories',type=int, default=2)
parser.add_argument('--player',dest='player_id',type=int,default=0)
return parser.parse_args()
def main(args):
args = parse_arguments()
isTraining = args.train
territories = args.territories
player_id = args.player_id
act_list = [[0,1],[-1]]
agent = Agent(player_id, territories, act_list, "random_allot", "linear_attack_net", "random_fortify")
if __name__ == '__main__':
main(sys.argv)