Spaces:
Sleeping
Sleeping
sjz
commited on
Commit
·
d8f258e
1
Parent(s):
d97a106
fix AI vs AI bug
Browse files- const.py +6 -1
- pages/AI_VS_AI.py +75 -50
const.py
CHANGED
@@ -36,6 +36,11 @@ _PLAYER_COLOR = {
|
|
36 |
_BLANK: "Blank",
|
37 |
_BLACK: "YOU HUMAN",
|
38 |
}
|
|
|
|
|
|
|
|
|
|
|
39 |
_HORIZONTAL = np.array(
|
40 |
[
|
41 |
[0, 0, 0, 0, 0],
|
@@ -87,6 +92,6 @@ _ROOM_COLOR = {
|
|
87 |
|
88 |
_MODEL_PATH = {
|
89 |
"AlphaZero": "Gomoku_MCTS/checkpoint/2023-12-14-18-17-07_test_teaching_learning_collect_epochs=1000_size=9_model=normal/best_policy.model",
|
90 |
-
"duel": "
|
91 |
"Gumbel AlphaZero": "Gomoku_MCTS/checkpoint/2023-12-14-21-19-40_selfplay_epochs=1000_size=9_model=gumbel/best_policy.model",
|
92 |
}
|
|
|
36 |
_BLANK: "Blank",
|
37 |
_BLACK: "YOU HUMAN",
|
38 |
}
|
39 |
+
_PLAYER_COLOR_AI_VS_AI = {
|
40 |
+
_WHITE: "WHITE",
|
41 |
+
_BLANK: "Blank",
|
42 |
+
_BLACK: "BLACK",
|
43 |
+
}
|
44 |
_HORIZONTAL = np.array(
|
45 |
[
|
46 |
[0, 0, 0, 0, 0],
|
|
|
92 |
|
93 |
_MODEL_PATH = {
|
94 |
"AlphaZero": "Gomoku_MCTS/checkpoint/2023-12-14-18-17-07_test_teaching_learning_collect_epochs=1000_size=9_model=normal/best_policy.model",
|
95 |
+
"duel": "Gomoku_MCTS/checkpoint/2023-12-14-10-22-12_test_teaching_learning_collect_epochs=1000_size=9_model=duel/best_policy.model",
|
96 |
"Gumbel AlphaZero": "Gomoku_MCTS/checkpoint/2023-12-14-21-19-40_selfplay_epochs=1000_size=9_model=gumbel/best_policy.model",
|
97 |
}
|
pages/AI_VS_AI.py
CHANGED
@@ -24,7 +24,7 @@ from const import (
|
|
24 |
_BLACK, # 1, for human
|
25 |
_WHITE, # 2 , for AI
|
26 |
_BLANK,
|
27 |
-
|
28 |
_PLAYER_SYMBOL1,
|
29 |
_PLAYER_SYMBOL2,
|
30 |
_ROOM_COLOR,
|
@@ -438,38 +438,50 @@ def gomoku():
|
|
438 |
in session_state.ROOM.COORDINATE_1D
|
439 |
):
|
440 |
if i == gpt_i and j == gpt_j:
|
441 |
-
BOARD_PLATE[i][j].button(
|
442 |
-
|
443 |
-
|
444 |
-
|
445 |
-
|
|
|
|
|
|
|
446 |
)
|
447 |
else:
|
448 |
# disable click for GPT choices
|
449 |
-
BOARD_PLATE[i][j].button(
|
450 |
-
|
451 |
-
|
452 |
-
|
453 |
-
|
|
|
|
|
|
|
454 |
)
|
455 |
else:
|
456 |
if session_state.USE_AIAID and i * _BOARD_SIZE + j in top_five_acts and not \
|
457 |
session_state.ROOM.BOARD.game_end()[0]:
|
458 |
# enable click for other cells available for human choices
|
459 |
prob = top_five_probs[top_five_acts.index(i * _BOARD_SIZE + j)]
|
460 |
-
BOARD_PLATE[i][j].button(
|
461 |
-
|
462 |
-
|
463 |
-
|
464 |
-
|
|
|
|
|
|
|
465 |
)
|
466 |
else:
|
467 |
# enable click for other cells available for human choices
|
468 |
-
BOARD_PLATE[i][j].button(
|
469 |
-
|
470 |
-
|
471 |
-
|
472 |
-
|
|
|
|
|
|
|
473 |
)
|
474 |
|
475 |
message.markdown(
|
@@ -512,7 +524,6 @@ def gomoku():
|
|
512 |
print("AI's move is located at ({}, {}) :".format(gpt_i, gpt_j))
|
513 |
move = session_state.ROOM.BOARD.location_to_move((gpt_i, gpt_j))
|
514 |
print("Location to move: ", move)
|
515 |
-
# print("Location to move: ", move)
|
516 |
# MCTS BOARD
|
517 |
session_state.ROOM.BOARD.do_move(move)
|
518 |
# Gomoku Bot BOARD
|
@@ -541,38 +552,50 @@ def gomoku():
|
|
541 |
in session_state.ROOM.COORDINATE_1D
|
542 |
):
|
543 |
if i == gpt_i and j == gpt_j:
|
544 |
-
BOARD_PLATE[i][j].button(
|
545 |
-
|
546 |
-
|
547 |
-
|
548 |
-
|
|
|
|
|
|
|
549 |
)
|
550 |
else:
|
551 |
# disable click for GPT choices
|
552 |
-
BOARD_PLATE[i][j].button(
|
553 |
-
|
554 |
-
|
555 |
-
|
556 |
-
|
|
|
|
|
|
|
557 |
)
|
558 |
else:
|
559 |
if session_state.USE_AIAID and i * _BOARD_SIZE + j in top_five_acts and not \
|
560 |
session_state.ROOM.BOARD.game_end()[0]:
|
561 |
# enable click for other cells available for human choices
|
562 |
prob = top_five_probs[top_five_acts.index(i * _BOARD_SIZE + j)]
|
563 |
-
BOARD_PLATE[i][j].button(
|
564 |
-
|
565 |
-
|
566 |
-
|
567 |
-
|
|
|
|
|
|
|
568 |
)
|
569 |
else:
|
570 |
# enable click for other cells available for human choices
|
571 |
-
BOARD_PLATE[i][j].button(
|
572 |
-
|
573 |
-
|
574 |
-
|
575 |
-
|
|
|
|
|
|
|
576 |
)
|
577 |
|
578 |
message.markdown(
|
@@ -623,21 +646,23 @@ def gomoku():
|
|
623 |
# Infos
|
624 |
def update_info() -> None:
|
625 |
# Additional information
|
626 |
-
SCORE_PLATE[0].metric("Gomoku-Agent", session_state.ROOM.HISTORY[0])
|
627 |
-
SCORE_PLATE[1].metric("Black", session_state.ROOM.HISTORY[1])
|
628 |
if session_state.ROOM.WINNER != _BLANK:
|
629 |
st.balloons()
|
630 |
ROUND_INFO.write(
|
631 |
-
f"#### **{
|
632 |
)
|
633 |
st.markdown("<br>", unsafe_allow_html=True)
|
634 |
st.markdown("<br>", unsafe_allow_html=True)
|
635 |
chart_data = pd.DataFrame(session_state.ROOM.ai_simula_time_list, columns=["Simulation Time"])
|
636 |
-
|
637 |
-
|
638 |
-
|
639 |
-
|
640 |
-
|
|
|
|
|
|
|
|
|
641 |
|
642 |
if __name__ == "__main__":
|
643 |
gomoku()
|
|
|
24 |
_BLACK, # 1, for human
|
25 |
_WHITE, # 2 , for AI
|
26 |
_BLANK,
|
27 |
+
_PLAYER_COLOR_AI_VS_AI,
|
28 |
_PLAYER_SYMBOL1,
|
29 |
_PLAYER_SYMBOL2,
|
30 |
_ROOM_COLOR,
|
|
|
438 |
in session_state.ROOM.COORDINATE_1D
|
439 |
):
|
440 |
if i == gpt_i and j == gpt_j:
|
441 |
+
# BOARD_PLATE[i][j].button(
|
442 |
+
# session_state.Symbol[_NEW],
|
443 |
+
# key=f"{i}:{j}",
|
444 |
+
# args=(i, j),
|
445 |
+
# on_click=forbid_click,
|
446 |
+
# )
|
447 |
+
BOARD_PLATE[i][j].write(
|
448 |
+
session_state.Symbol[_NEW]
|
449 |
)
|
450 |
else:
|
451 |
# disable click for GPT choices
|
452 |
+
# BOARD_PLATE[i][j].button(
|
453 |
+
# session_state.Symbol[cell],
|
454 |
+
# key=f"{i}:{j}",
|
455 |
+
# args=(i, j),
|
456 |
+
# on_click=forbid_click
|
457 |
+
# )
|
458 |
+
BOARD_PLATE[i][j].write(
|
459 |
+
session_state.Symbol[cell]
|
460 |
)
|
461 |
else:
|
462 |
if session_state.USE_AIAID and i * _BOARD_SIZE + j in top_five_acts and not \
|
463 |
session_state.ROOM.BOARD.game_end()[0]:
|
464 |
# enable click for other cells available for human choices
|
465 |
prob = top_five_probs[top_five_acts.index(i * _BOARD_SIZE + j)]
|
466 |
+
# BOARD_PLATE[i][j].button(
|
467 |
+
# session_state.Symbol[cell] + f"({round(prob, 2)})",
|
468 |
+
# key=f"{i}:{j}",
|
469 |
+
# on_click=forbid_click,
|
470 |
+
# args=(i, j),
|
471 |
+
# )
|
472 |
+
BOARD_PLATE[i][j].write(
|
473 |
+
session_state.Symbol[cell]
|
474 |
)
|
475 |
else:
|
476 |
# enable click for other cells available for human choices
|
477 |
+
# BOARD_PLATE[i][j].button(
|
478 |
+
# session_state.Symbol[cell],
|
479 |
+
# key=f"{i}:{j}",
|
480 |
+
# on_click=forbid_click,
|
481 |
+
# args=(i, j),
|
482 |
+
# )
|
483 |
+
BOARD_PLATE[i][j].write(
|
484 |
+
session_state.Symbol[cell]
|
485 |
)
|
486 |
|
487 |
message.markdown(
|
|
|
524 |
print("AI's move is located at ({}, {}) :".format(gpt_i, gpt_j))
|
525 |
move = session_state.ROOM.BOARD.location_to_move((gpt_i, gpt_j))
|
526 |
print("Location to move: ", move)
|
|
|
527 |
# MCTS BOARD
|
528 |
session_state.ROOM.BOARD.do_move(move)
|
529 |
# Gomoku Bot BOARD
|
|
|
552 |
in session_state.ROOM.COORDINATE_1D
|
553 |
):
|
554 |
if i == gpt_i and j == gpt_j:
|
555 |
+
# BOARD_PLATE[i][j].button(
|
556 |
+
# session_state.Symbol[_NEW],
|
557 |
+
# key=f"{i}:{j}",
|
558 |
+
# args=(i, j),
|
559 |
+
# on_click=forbid_click,
|
560 |
+
# )
|
561 |
+
BOARD_PLATE[i][j].write(
|
562 |
+
session_state.Symbol[_NEW]
|
563 |
)
|
564 |
else:
|
565 |
# disable click for GPT choices
|
566 |
+
# BOARD_PLATE[i][j].button(
|
567 |
+
# session_state.Symbol[cell],
|
568 |
+
# key=f"{i}:{j}",
|
569 |
+
# args=(i, j),
|
570 |
+
# on_click=forbid_click
|
571 |
+
# )
|
572 |
+
BOARD_PLATE[i][j].write(
|
573 |
+
session_state.Symbol[cell]
|
574 |
)
|
575 |
else:
|
576 |
if session_state.USE_AIAID and i * _BOARD_SIZE + j in top_five_acts and not \
|
577 |
session_state.ROOM.BOARD.game_end()[0]:
|
578 |
# enable click for other cells available for human choices
|
579 |
prob = top_five_probs[top_five_acts.index(i * _BOARD_SIZE + j)]
|
580 |
+
# BOARD_PLATE[i][j].button(
|
581 |
+
# session_state.Symbol[cell] + f"({round(prob, 2)})",
|
582 |
+
# key=f"{i}:{j}",
|
583 |
+
# on_click=forbid_click,
|
584 |
+
# args=(i, j),
|
585 |
+
# )
|
586 |
+
BOARD_PLATE[i][j].write(
|
587 |
+
session_state.Symbol[cell]
|
588 |
)
|
589 |
else:
|
590 |
# enable click for other cells available for human choices
|
591 |
+
# BOARD_PLATE[i][j].button(
|
592 |
+
# session_state.Symbol[cell],
|
593 |
+
# key=f"{i}:{j}",
|
594 |
+
# on_click=forbid_click,
|
595 |
+
# args=(i, j),
|
596 |
+
# )
|
597 |
+
BOARD_PLATE[i][j].write(
|
598 |
+
session_state.Symbol[cell]
|
599 |
)
|
600 |
|
601 |
message.markdown(
|
|
|
646 |
# Infos
|
647 |
def update_info() -> None:
|
648 |
# Additional information
|
|
|
|
|
649 |
if session_state.ROOM.WINNER != _BLANK:
|
650 |
st.balloons()
|
651 |
ROUND_INFO.write(
|
652 |
+
f"#### **{_PLAYER_COLOR_AI_VS_AI[session_state.ROOM.WINNER]} WIN!**\n**Click buttons on the left for more plays.**"
|
653 |
)
|
654 |
st.markdown("<br>", unsafe_allow_html=True)
|
655 |
st.markdown("<br>", unsafe_allow_html=True)
|
656 |
chart_data = pd.DataFrame(session_state.ROOM.ai_simula_time_list, columns=["Simulation Time"])
|
657 |
+
chart_placeholder.line_chart(chart_data)
|
658 |
+
|
659 |
+
|
660 |
+
chart_placeholder = st.empty()
|
661 |
+
while session_state.ROOM.WINNER == _BLANK:
|
662 |
+
game_control()
|
663 |
+
update_info()
|
664 |
+
SCORE_PLATE[0].metric("Gomoku-Agent", session_state.ROOM.HISTORY[0])
|
665 |
+
SCORE_PLATE[1].metric("Black", session_state.ROOM.HISTORY[1])
|
666 |
|
667 |
if __name__ == "__main__":
|
668 |
gomoku()
|