Spaces:
Sleeping
Sleeping
Commit
·
1375e49
1
Parent(s):
46773aa
implement interactive ui
Browse files
app.py
CHANGED
|
@@ -34,28 +34,58 @@ tokenizer = Tokenizer.from_pretrained(tokenizer_path)
|
|
| 34 |
|
| 35 |
invalid_move_plot = Image.open('./invalid_move.png')
|
| 36 |
|
| 37 |
-
def
|
| 38 |
-
|
| 39 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
pgn_str = StringIO(pgn)
|
| 41 |
try:
|
| 42 |
game = chess.pgn.read_game(pgn_str)
|
| 43 |
board = game.board()
|
| 44 |
for move in game.mainline_moves():
|
| 45 |
board.push(move)
|
| 46 |
-
img = chess.svg.board(board)
|
| 47 |
except Exception as e:
|
| 48 |
if 'illegal san' in str(e):
|
| 49 |
-
return
|
| 50 |
-
|
| 51 |
-
with open(filename + '.svg', 'w') as f:
|
| 52 |
-
f.write(img)
|
| 53 |
-
drawing = svg2rlg(filename + '.svg')
|
| 54 |
-
renderPM.drawToFile(drawing, f"{filename}.png", fmt="PNG")
|
| 55 |
-
plot = Image.open(f'{filename}.png')
|
| 56 |
|
| 57 |
-
|
| 58 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 59 |
return pgn, plot
|
| 60 |
|
| 61 |
|
|
@@ -66,21 +96,71 @@ with gr.Blocks() as demo:
|
|
| 66 |
|
| 67 |
The **C**hess-**P**re-trained-**T**ransformer.
|
| 68 |
|
| 69 |
-
The rules are simple:
|
|
|
|
|
|
|
| 70 |
""")
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
|
| 76 |
-
|
| 77 |
-
|
| 78 |
-
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
-
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 86 |
demo.launch()
|
|
|
|
| 34 |
|
| 35 |
invalid_move_plot = Image.open('./invalid_move.png')
|
| 36 |
|
| 37 |
+
def gen_image_from_svg(img, filename):
|
| 38 |
+
with open(filename + '.svg', 'w') as f:
|
| 39 |
+
f.write(img)
|
| 40 |
+
drawing = svg2rlg(filename + '.svg')
|
| 41 |
+
renderPM.drawToFile(drawing, f"{filename}.png", fmt="PNG")
|
| 42 |
+
plot = Image.open(f'{filename}.png')
|
| 43 |
+
|
| 44 |
+
os.remove(f'{filename}.png')
|
| 45 |
+
os.remove(f'{filename}.svg')
|
| 46 |
+
return plot
|
| 47 |
+
|
| 48 |
+
|
| 49 |
+
def get_board(pgn):
|
| 50 |
pgn_str = StringIO(pgn)
|
| 51 |
try:
|
| 52 |
game = chess.pgn.read_game(pgn_str)
|
| 53 |
board = game.board()
|
| 54 |
for move in game.mainline_moves():
|
| 55 |
board.push(move)
|
|
|
|
| 56 |
except Exception as e:
|
| 57 |
if 'illegal san' in str(e):
|
| 58 |
+
return None
|
| 59 |
+
return board
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 60 |
|
| 61 |
+
def gen_board_image(pgn):
|
| 62 |
+
board = get_board(pgn)
|
| 63 |
+
return chess.svg.board(board)
|
| 64 |
+
|
| 65 |
+
def gen_move(pgn):
|
| 66 |
+
model_input = torch.tensor(tokenizer.encode(pgn), dtype=torch.long, device=device).view((1, len(pgn)))
|
| 67 |
+
is_invalid = True
|
| 68 |
+
board = get_board(pgn)
|
| 69 |
+
while is_invalid:
|
| 70 |
+
new_pgn = tokenizer.decode(model.generate(model_input, max_new_tokens=4, context_size=context_size, temperature=0.2)[0].tolist())
|
| 71 |
+
try:
|
| 72 |
+
print(f'checking {new_pgn}')
|
| 73 |
+
mv = new_pgn[len(pgn):].split(' ')[0]
|
| 74 |
+
new_pgn = pgn.rstrip() + f' {mv}'
|
| 75 |
+
is_invalid = get_board(new_pgn) is None
|
| 76 |
+
except Exception:
|
| 77 |
+
is_invalid = True
|
| 78 |
+
print(f'For {pgn} invalid "{new_pgn[len(pgn):].split(" ")[0]}" {new_pgn}')
|
| 79 |
+
#print(mov in board.legal_moves)
|
| 80 |
+
return new_pgn
|
| 81 |
+
|
| 82 |
+
|
| 83 |
+
def generate(prompt):
|
| 84 |
+
model_input = torch.tensor(tokenizer.encode(prompt), dtype=torch.long, device=device).view((1, len(prompt)))
|
| 85 |
+
pgn = tokenizer.decode(model.generate(model_input, max_new_tokens=4, context_size=context_size, temperature=0.2)[0].tolist())
|
| 86 |
+
img = gen_board_image(pgn)
|
| 87 |
+
filename = f'./moves-{str(uuid4())}'
|
| 88 |
+
plot = gen_image_from_svg(img, filename)
|
| 89 |
return pgn, plot
|
| 90 |
|
| 91 |
|
|
|
|
| 96 |
|
| 97 |
The **C**hess-**P**re-trained-**T**ransformer.
|
| 98 |
|
| 99 |
+
The rules are simple:
|
| 100 |
+
- "Interactive": Play a game against the model
|
| 101 |
+
- "Next turn prediction": provide a PGN string of your current game, the model will predict the next token
|
| 102 |
""")
|
| 103 |
+
def manual():
|
| 104 |
+
with gr.Tab("Next turn prediction"):
|
| 105 |
+
prompt = gr.Text(label="PGN")
|
| 106 |
+
output = gr.Text(label="Next turn", interactive=False)
|
| 107 |
+
img = gr.Image()
|
| 108 |
+
submit = gr.Button("Submit")
|
| 109 |
+
submit.click(generate, [prompt], [output, img])
|
| 110 |
+
|
| 111 |
+
gr.Examples(
|
| 112 |
+
[
|
| 113 |
+
["1. e4", ],
|
| 114 |
+
["1. e4 g6 2."],
|
| 115 |
+
],
|
| 116 |
+
inputs=[prompt],
|
| 117 |
+
outputs=[output, img],
|
| 118 |
+
fn=generate
|
| 119 |
+
)
|
| 120 |
+
def interactive():
|
| 121 |
+
with gr.Tab("Interactive"):
|
| 122 |
+
color = gr.Dropdown(["white", "black"], value='white', label="Chose a color")
|
| 123 |
+
start_button = gr.Button("Start Game")
|
| 124 |
+
|
| 125 |
+
def start_game(c):
|
| 126 |
+
pgn = '1. '
|
| 127 |
+
if c == 'black':
|
| 128 |
+
pgn += gen_move(pgn)
|
| 129 |
+
img = gen_board_image(pgn)
|
| 130 |
+
fn = 'foo'
|
| 131 |
+
return gen_image_from_svg(img, fn), pgn, 1
|
| 132 |
+
|
| 133 |
+
state = gr.Text(label='PGN', value='', interactive=False)
|
| 134 |
+
game = gr.Image()
|
| 135 |
+
move_counter = gr.State(value=1)
|
| 136 |
+
start_button.click(
|
| 137 |
+
start_game,
|
| 138 |
+
inputs=[color],
|
| 139 |
+
outputs=[game, state, move_counter]
|
| 140 |
+
)
|
| 141 |
+
|
| 142 |
+
next_move = gr.Text(label='Next move')
|
| 143 |
+
gen_next_move_button = gr.Button("Submit")
|
| 144 |
+
|
| 145 |
+
def gen_next_move(pgn, new_move, move_ctr, c):
|
| 146 |
+
pgn += new_move.strip() + ' '
|
| 147 |
+
if c == 'black':
|
| 148 |
+
move_ctr += 1
|
| 149 |
+
pgn = f'{pgn.rstrip()} {move_ctr}. '
|
| 150 |
+
print(f'gen for {pgn}')
|
| 151 |
+
pgn = gen_move(pgn)
|
| 152 |
+
print(f'got {pgn}')
|
| 153 |
+
img = gen_board_image(pgn)
|
| 154 |
+
if c == 'white':
|
| 155 |
+
move_ctr += 1
|
| 156 |
+
pgn = f'{pgn.rstrip()} {move_ctr}. '
|
| 157 |
+
return gen_image_from_svg(img, 'foo-bar'), pgn, move_ctr
|
| 158 |
+
|
| 159 |
+
gen_next_move_button.click(
|
| 160 |
+
gen_next_move,
|
| 161 |
+
inputs=[state, next_move, move_counter, color],
|
| 162 |
+
outputs=[game, state, move_counter]
|
| 163 |
+
)
|
| 164 |
+
interactive()
|
| 165 |
+
manual()
|
| 166 |
demo.launch()
|
model.py
CHANGED
|
@@ -120,7 +120,7 @@ class DecoderTransformer(nn.Module):
|
|
| 120 |
loss = F.cross_entropy(logits, targets)
|
| 121 |
return logits, loss
|
| 122 |
|
| 123 |
-
def generate(self, idx, max_new_tokens=50, context_size=None):
|
| 124 |
if context_size is None:
|
| 125 |
context_size = int(self.position_embedding_table.weight.shape[0])
|
| 126 |
print(context_size)
|
|
@@ -128,7 +128,7 @@ class DecoderTransformer(nn.Module):
|
|
| 128 |
for _ in range(max_new_tokens):
|
| 129 |
idx_cond = idx[:, -context_size:]
|
| 130 |
logits, loss = self(idx_cond)
|
| 131 |
-
logits = logits[:,-1,:]
|
| 132 |
probs = F.softmax(logits, dim=-1)
|
| 133 |
idx_next = torch.multinomial(probs, num_samples=1)
|
| 134 |
idx = torch.cat([idx, idx_next], dim=1)
|
|
|
|
| 120 |
loss = F.cross_entropy(logits, targets)
|
| 121 |
return logits, loss
|
| 122 |
|
| 123 |
+
def generate(self, idx, max_new_tokens=50, context_size=None, temperature=1.0):
|
| 124 |
if context_size is None:
|
| 125 |
context_size = int(self.position_embedding_table.weight.shape[0])
|
| 126 |
print(context_size)
|
|
|
|
| 128 |
for _ in range(max_new_tokens):
|
| 129 |
idx_cond = idx[:, -context_size:]
|
| 130 |
logits, loss = self(idx_cond)
|
| 131 |
+
logits = logits[:,-1,:] / temperature
|
| 132 |
probs = F.softmax(logits, dim=-1)
|
| 133 |
idx_next = torch.multinomial(probs, num_samples=1)
|
| 134 |
idx = torch.cat([idx, idx_next], dim=1)
|