forked from AlexBai0/MahjongRL
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMain.py
51 lines (46 loc) · 1.28 KB
/
Main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
from utils.tenhouconnection import Connection
import gym
from QLearning import QLearning as QLe
from gym_mahjong.envs.mahjong_his_env import MahjongEnv
def play():
    """Build a Q-learning agent and run it over a ``Connection``.

    Creates the ``'Mahjong-v0'`` gym environment, wraps it in a ``QLe``
    agent, and hands that agent to a ``Connection``. After connecting, the
    authentication result is printed; if it is truthy the connection's
    ``play()`` is invoked, otherwise the connection is ended.
    """
    mahjong_env = gym.envs.make('Mahjong-v0')
    session = Connection(QLe(mahjong_env))

    session.connect()
    # NOTE: `authencate` (sic) is the method name exposed by Connection.
    authenticated = session.authencate()
    print(authenticated)

    # Guard clause: without a successful authentication, just close down.
    if not authenticated:
        session.end()
        return

    session.play()
# Disabled alternative entry point, kept for reference: run 300 episodes
# against the gym environment (learning on some of the later ones) before
# connecting and playing. Indentation below is reconstructed.
# def train_and_play():
#     env = gym.envs.make('Mahjong-v0')
#     QL = QLe(env)
#     validation = []
#     for episode in range(300):
#         observation = env.reset_()
#         while True:
#             action = QL.decision(observation)
#             observation_after, reward, finish, validate = env.step(action)
#             QL.toHistory(observation, action, reward, observation_after)
#             validation.append(validate)
#             if (episode > 200) and (episode % 5 == 0):
#                 QL.learn()
#                 # print('Learned!')
#
#             observation = observation_after
#
#             if finish:
#                 break
#     connection = Connection(QL)
#
#
#     connection.connect()
#     auth = connection.authencate()
#     print(auth)
#     if auth:
#         connection.play()
#     else:
#         connection.end()
# Script entry point: only start a session when this file is executed
# directly, not when it is imported as a module.
if __name__ == '__main__':
    play()