# GameModel/sim_Series.py at master · wyz2368/GameModel · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
from parallel_sim import parallel_sim
import numpy as np
from load_action import load_action
import file_op as fp
import os


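# NOTE: the commented-out block below appears to be an earlier draft of
# sim_and_modifiy_Series (the live definition is further down in this file);
# it is kept for reference only.
# #TODO (original note, left unfinished by the author): make sure every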
# def sim_and_modifiy_Series():
#     print('Begin simulation and modify payoff matrix.')
#     path = os.getcwd() + '/data/game.pkl'
#     game = fp.load_pkl(path)
#     data = sim_and_modifiy(game)
#
#     #TODO: modify payoff matrix
#     old_dim, _ = game.dim_payoff_def()
#     new_dim, _ = game.num_str()
#
#     new_col_def = []
#     new_row_def = []
#     new_col_att = []
#     new_row_att = []
#
#     for i in range(old_dim):
#         aReward_col, dReward_col = data[(i,new_dim-1)]
#         aReward_row, dReward_row = data[(new_dim - 1,i)]
#         new_col_def.append([dReward_col])
#         new_row_def.append(dReward_row)
#         new_col_att.append([aReward_col])
#         new_row_att.append(aReward_row)
#
#     aReward, dReward = data[(new_dim - 1,new_dim - 1)]
#     new_row_def.append(dReward)
#     new_row_att.append(aReward)
#     print("Done simulation and modify payoff matrix.")


def sim_and_modifiy_Series():
    """Simulate the newest strategy pairings one by one and extend the payoffs.

    The game object is loaded from ``<cwd>/data/game.pkl``. Every pairing that
    involves the last strategy index (``new_dim - 1``) is simulated
    sequentially with ``parallel_sim``:

    * column entries: defender ``i`` vs. attacker ``new_dim - 1`` for
      ``i`` in ``0 .. new_dim - 2``;
    * row entries: defender ``new_dim - 1`` vs. attacker ``j`` for
      ``j`` in ``0 .. new_dim - 1`` (this includes the corner entry).

    The collected rewards are handed to ``game.add_col_att``,
    ``game.add_col_def``, ``game.add_row_att`` and ``game.add_row_def``
    (in that order), and the game is pickled back to the same path.

    Raises:
        ValueError: if the two values returned by ``game.dim_payoff_def()``
            differ, or the two values returned by ``game.num_str()`` differ.
    """
    # TODO: make sure this is correct
    print('Begin simulation and modify payoff matrix.')
    path = os.getcwd() + '/data/game.pkl'
    game = fp.load_pkl(path)

    env = game.env
    num_episodes = game.num_episodes

    # TODO: add str first and then calculate payoff
    old_dim, old_dim1 = game.dim_payoff_def()
    new_dim, new_dim1 = game.num_str()
    if old_dim != old_dim1 or new_dim != new_dim1:
        raise ValueError("Payoff dimension does not match.")

    def_str_list = game.def_str
    att_str_list = game.att_str
    dir_def = game.dir_def
    dir_att = game.dir_att

    def _simulate(positions):
        """Run one simulation per (defender idx, attacker idx) position.

        Returns two lists, attacker rewards and defender rewards, in the
        same order as ``positions``.
        """
        att_rewards = []
        def_rewards = []
        for idx_def, idx_att in positions:
            # TODO: check the path is correct
            # Paths are built by plain string concatenation, so dir_def /
            # dir_att are presumably expected to end with a path separator.
            nn_def = load_action(dir_def + def_str_list[idx_def], game)
            nn_att = load_action(dir_att + att_str_list[idx_att], game)
            a_reward, d_reward = parallel_sim(env, nn_att, nn_def, num_episodes)
            att_rewards.append(a_reward)
            def_rewards.append(d_reward)
        return att_rewards, def_rewards

    last = new_dim - 1
    # New column: every earlier defender strategy against the newest attacker.
    col_positions = [(i, last) for i in range(last)]
    # New row: the newest defender strategy against every attacker strategy.
    row_positions = [(last, j) for j in range(new_dim)]

    # Columns are simulated before rows, matching the original call order.
    att_col, def_col = _simulate(col_positions)
    att_row, def_row = _simulate(row_positions)

    # The target shape is passed positionally: the ``newshape`` keyword of
    # np.reshape is deprecated in recent NumPy releases. Each column is shaped
    # from its own length rather than borrowing the attacker column's length.
    game.add_col_att(np.reshape(np.array(att_col), (len(att_col), 1)))
    game.add_col_def(np.reshape(np.array(def_col), (len(def_col), 1)))
    game.add_row_att(np.array(att_row))
    game.add_row_def(np.array(def_row))

    fp.save_pkl(game, path=path)
    print("Done simulation and modify payoff matrix.")