Spaces:

nuriyev
/

chess

Running on Zero

App Files Files Community

chess / app.py

nuriyev

use correct template var

5f16693 9 days ago

raw

history blame contribute delete

8.07 kB

	import re
	import chess
	import gradio as gr
	import spaces
	from jinja2 import Template
	from gradio_chessboard import Chessboard
	import torch
	from transformers import AutoModelForCausalLM, AutoTokenizer

	# ============================================================================
	# Model Loading
	# ============================================================================

	MODEL_ID = "nuriyev/chess-reasoner-grpo"

	# Keyword arguments forwarded to AutoModelForCausalLM.from_pretrained:
	# half-precision weights, automatic device placement, execution of the
	# repository's custom code, and a pinned repository revision.
	_model_load_options = {
	    "torch_dtype": torch.float16,
	    "device_map": "auto",
	    "trust_remote_code": True,
	    "revision": "b7e531a630fd35065f9c8287f4bd21dff42f871b",
	}

	# The tokenizer and the model are loaded once, when this module is imported.
	# NOTE(review): only the model load passes a revision; the tokenizer load
	# does not - confirm that this is intended.
	print("Loading model...")
	tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
	model = AutoModelForCausalLM.from_pretrained(MODEL_ID, **_model_load_options)
	model.eval()
	print("Model loaded!")


	# ============================================================================
	# Prompts (matching training exactly)
	# ============================================================================

	# Jinja2 prompt rendered once per model move.
	#
	# Template variables:
	#   FEN             - full FEN string; only its first field (piece placement)
	#                     is read by the template.
	#   side_to_move    - text shown in the "Turn:" line.
	#   legal_moves_uci - text shown in the "Legal Moves:" line.
	#
	# The piece-placement field is expanded into a 64-character string (each
	# digit becomes that many '.', '/' separators are dropped), so index
	# (8 - rank) * 8 + file addresses a square. The board is then printed one
	# file per line (a..h), each line listing ranks 1..8 as "a1:R a2:P ...".
	#
	# The digit expansion must use the Jinja filter syntax `char|int`; a
	# backslash before the pipe is not valid inside a Jinja expression.
	USER_PROMPT = Template("""You are an expert chess player.

	Given a current game state, you must select the best legal next move. Think in 1-2 sentences, then output your chosen move.

	## State

	Board:
	{% set fen_board = FEN.split()[0] %}
	{%- set ns = namespace(board='') -%}
	{%- for char in fen_board -%}
	{%- if char in '12345678' -%}
	{%- set ns.board = ns.board ~ '.' * (char|int) -%}
	{%- elif char != '/' -%}
	{%- set ns.board = ns.board ~ char -%}
	{%- endif -%}
	{%- endfor -%}
	{#- Output coordinate grid by file -#}
	{%- set files = 'abcdefgh' -%}
	{% for f in range(8) %}
	{%- for r in range(1, 9) -%}
	{{ files[f] }}{{ r }}:{{ ns.board[(8-r)*8 + f] }}{% if r < 8 %} {% endif -%}
	{%- endfor %}
	{% endfor %}
	Turn: It is your turn ({{ side_to_move }})
	Legal Moves: {{ legal_moves_uci }}

	## Output format

	<reason>...brief thinking (1-2 first-person very short concise sentences, identifying threat or opportunity, then deciding on the best move to play next)...</reason>
	<uci_move>...your_move...</uci_move>

	NOTE: capital letters are white, lowercase are black.""")


	# ============================================================================
	# Model Inference
	# ============================================================================

	def _parse_model_output(generated: str) -> "tuple[str | None, str, str]":
	    """Split decoded model text into ``(uci_move, reasoning, raw_output)``."""
	    reason_match = re.search(r'<reason>(.*?)</reason>', generated, re.DOTALL)
	    # DOTALL (plus the strip below) lets a move that the model put on its own
	    # line inside the tags still be recognised.
	    move_match = re.search(r'<uci_move>(.*?)</uci_move>', generated, re.DOTALL)

	    if reason_match:
	        reasoning = reason_match.group(1).strip()
	    else:
	        reasoning = "No reasoning provided"
	    uci_move = move_match.group(1).strip() if move_match else None

	    # Keep only the text before the end-of-turn marker for display. The
	    # marker must be spelled without backslashes or it never matches.
	    raw_output = generated.split('<|im_end|>')[0].strip()

	    return uci_move, reasoning, raw_output


	@spaces.GPU
	def get_model_move(fen: str) -> "tuple[str | None, str, str]":
	    """Ask the model for a move in the position described by ``fen``.

	    Renders ``USER_PROMPT`` for the position (board, side to move, legal moves
	    in UCI notation), wraps it with the tokenizer's chat template, samples up
	    to 256 new tokens and extracts the ``<reason>`` and ``<uci_move>`` tags
	    from the reply.

	    Args:
	        fen: FEN string of the position in which the model should move.

	    Returns:
	        ``(uci_move, reasoning, raw_output)``. ``uci_move`` is ``None`` when
	        the reply contains no ``<uci_move>`` tag; the move is not checked for
	        legality here. ``reasoning`` falls back to
	        ``"No reasoning provided"``. ``raw_output`` is the reply text up to
	        the ``<|im_end|>`` marker.
	    """
	    board = chess.Board(fen)
	    side_to_move = "white" if board.turn else "black"
	    legal_moves_uci = ", ".join(move.uci() for move in board.legal_moves)

	    messages = [
	        {
	            "role": "user",
	            "content": USER_PROMPT.render(
	                FEN=fen,
	                side_to_move=side_to_move,
	                legal_moves_uci=legal_moves_uci,
	            ),
	        },
	    ]

	    text = tokenizer.apply_chat_template(
	        messages,
	        tokenize=False,
	        add_generation_prompt=True,
	    )

	    inputs = tokenizer(text, return_tensors="pt").to(model.device)

	    with torch.no_grad():
	        outputs = model.generate(
	            **inputs,
	            max_new_tokens=256,
	            temperature=0.7,
	            top_p=0.8,
	            top_k=20,
	            do_sample=True,
	            pad_token_id=tokenizer.pad_token_id,
	        )

	    # Decode only the newly generated tokens (everything after the prompt).
	    # Special tokens are kept so the end-of-turn marker can be located.
	    prompt_length = inputs['input_ids'].shape[1]
	    generated = tokenizer.decode(
	        outputs[0][prompt_length:], skip_special_tokens=False)

	    return _parse_model_output(generated)


	# ============================================================================
	# Game Logic
	# ============================================================================

	def _turn_status(board: chess.Board) -> str:
	    """Build the "Turn: ..." status line, appending a check warning if needed."""
	    turn_str = "White (You)" if board.turn else "Black (AI)"
	    status = f"Turn: {turn_str}"
	    if board.is_check():
	        status += " ⚠️ CHECK!"
	    return status


	def play_move(fen: str) -> tuple[str, str, str, str]:
	    """Process the position after the player's move and get the AI response.

	    Args:
	        fen: FEN string of the current board position.

	    Returns:
	        ``(new_fen, status, reasoning, raw_output)``.

	        * Game already over: the unchanged FEN, a result line and two empty
	          strings.
	        * White to move: the unchanged FEN, the turn status and two
	          ``gr.update()`` objects, so the reasoning display is preserved.
	        * Black to move: the model is queried. A legal move is pushed onto
	          the board. A missing, unparsable or illegal move leaves the board
	          unchanged and prefixes ``reasoning`` with a warning.
	    """
	    board = chess.Board(fen)

	    # Nothing to do when the game has already ended.
	    if board.is_game_over():
	        return fen, f"🏁 {get_game_result(board)}", "", ""

	    # White's turn - just return current state, preserve reasoning display.
	    if board.turn:
	        return fen, _turn_status(board), gr.update(), gr.update()

	    # Black's turn (AI): ask the model for a move.
	    uci_move, reasoning, raw_output = get_model_move(fen)

	    if not uci_move:
	        # Make a reply without a move visible instead of silently stalling.
	        reasoning = "⚠️ Model did not output a move. " + reasoning
	    else:
	        try:
	            # Only the parse can raise here; malformed UCI text raises a
	            # ValueError (or a subclass of it).
	            move = chess.Move.from_uci(uci_move)
	        except ValueError:
	            reasoning = f"⚠️ Model output invalid move: {uci_move}. " + reasoning
	        else:
	            if move in board.legal_moves:
	                board.push(move)
	            else:
	                reasoning = f"⚠️ Model suggested illegal move: {uci_move}. " + reasoning

	    # The AI move may have ended the game.
	    if board.is_game_over():
	        return board.fen(), f"🏁 {get_game_result(board)}", reasoning, raw_output

	    return board.fen(), _turn_status(board), reasoning, raw_output


	def get_game_result(board: chess.Board) -> str:
	    """Describe how the game on ``board`` ended.

	    Checkmate is tested first, then the draw conditions in a fixed order; the
	    first condition that holds decides the message. If none holds, the generic
	    ``"Game Over"`` is returned.
	    """
	    if board.is_checkmate():
	        # The side to move is the one that has been mated.
	        winner = "Black" if board.turn else "White"
	        return f"Checkmate! {winner} wins!"

	    # (check, message) pairs, evaluated lazily and in this order.
	    draw_checks = (
	        (board.is_stalemate, "Stalemate - Draw"),
	        (board.is_insufficient_material, "Draw - Insufficient material"),
	        (board.is_fifty_moves, "Draw - 50 move rule"),
	        (board.is_repetition, "Draw - Repetition"),
	    )
	    for condition_holds, message in draw_checks:
	        if condition_holds():
	            return message

	    return "Game Over"


	def reset_game() -> tuple[str, str, str, str]:
	    """Return the values for a fresh game.

	    The tuple is ``(fen, status, reasoning, raw_output)``: the standard
	    starting position, the White-to-move status line and two empty strings.
	    """
	    initial_fen = chess.STARTING_FEN
	    status_line = "Turn: White (You)"
	    cleared_reasoning = ""
	    cleared_raw_output = ""
	    return initial_fen, status_line, cleared_reasoning, cleared_raw_output


	def ai_plays_first() -> tuple[str, str, str, str]:
	    """Run ``play_move`` on the standard starting position and return its result.

	    NOTE(review): the starting position has White to move, while ``play_move``
	    only queries the model when Black is to move - confirm that this handler
	    really produces an AI opening move.
	    """
	    opening_result = play_move(chess.STARTING_FEN)
	    return opening_result


	# ============================================================================
	# Gradio Interface
	# ============================================================================

	# Build the Gradio UI: a chessboard, a status line, "New Game" and
	# "AI First" buttons, and two read-only text boxes for the model's reasoning
	# and its raw output; then wire the event handlers.
	# NOTE(review): the nesting of the Row / Column / Accordion contexts below is
	# not recoverable from the flattened indentation of this listing - confirm
	# the layout against the real file.
	with gr.Blocks(title="♟️ Chess Reasoner") as demo:
	gr.Markdown("""
	# ♟️ Chess Reasoner
	Play chess against a reasoning AI! You play as White - click on pieces to move them.
	""")

	with gr.Row():
	with gr.Column(scale=2):
	# Board widget, initialised with the standard starting position.
	board = Chessboard(value=chess.STARTING_FEN,
	label="", game_mode=True)

	with gr.Column(scale=1):
	# Status line; starts with the same text that reset_game() returns.
	status = gr.Markdown(value="Turn: White (You)")

	with gr.Row():
	reset_btn = gr.Button("🔄 New Game", variant="primary")
	ai_first_btn = gr.Button("🤖 AI First")

	with gr.Accordion("🧠 AI Reasoning", open=True):
	reasoning = gr.Textbox(
	label="Thinking", lines=3, interactive=False)

	with gr.Accordion("📝 Raw Output", open=False):
	raw_output = gr.Textbox(
	label="Model Output", lines=5, interactive=False)

	gr.Markdown("""
	---
	Model: [nuriyev/chess-reasoner-grpo](https://huggingface.co/nuriyev/chess-reasoner-grpo) • Fine-tuned from Qwen3-4B-Instruct
	""")

	# Events: every handler writes the same four outputs, in this order:
	# board, status, reasoning, raw_output.

	# A change of the board value runs play_move on the board's current value.
	board.change(
	fn=play_move,
	inputs=[board],
	outputs=[board, status, reasoning, raw_output]
	)

	# "New Game" restores the starting position and clears both text boxes.
	reset_btn.click(
	fn=reset_game,
	outputs=[board, status, reasoning, raw_output]
	)

	# "AI First" runs ai_plays_first, which takes no inputs.
	ai_first_btn.click(
	fn=ai_plays_first,
	outputs=[board, status, reasoning, raw_output]
	)

	# Launch the app only when this file is executed as a script (not when it is
	# imported). ssr_mode=False is passed through to Gradio's launch().
	if __name__ == "__main__":
	demo.launch(ssr_mode=False)