Update app.py
Browse files
app.py
CHANGED
@@ -116,10 +116,10 @@ demo = gr.Interface(
|
|
116 |
fn=step_episode,
|
117 |
inputs=gr.State(value=[START_POSITION, []]),
|
118 |
outputs=[board, state_fen, move_history, gr.State()],
|
119 |
-
title="♜ RookWorld Self-Play Demo",
|
120 |
-
description="""♜ RookWorld (GPT2-124M) Unified Policy &
|
121 |
-
Both the *policy actions* and the *environment response* (
|
122 |
-
Click the **Generate**-button to generate a new move and environment response. On CPU this can take 30 seconds per step.""",
|
123 |
allow_flagging="never",
|
124 |
analytics_enabled=False,
|
125 |
submit_btn="Generate",
|
|
|
116 |
fn=step_episode,
|
117 |
inputs=gr.State(value=[START_POSITION, []]),
|
118 |
outputs=[board, state_fen, move_history, gr.State()],
|
119 |
+
title="♜ RookWorld-LM-124M Self-Play Demo",
|
120 |
+
description="""♜ RookWorld-LM (GPT2-124M) Unified Policy & World Model
|
121 |
+
Both the *policy actions* (with generated CoT) and the *environment response* (World Model) are fully generated by a single language model.
|
122 |
+
Click the **Generate**-button to generate a new move and environment response. On CPU this can take ~30 seconds per step.""",
|
123 |
allow_flagging="never",
|
124 |
analytics_enabled=False,
|
125 |
submit_btn="Generate",
|