Spaces:

lcipolina
/

LLM_OpenSpiel_Arena

Sleeping

App Files Files Community

LLM_OpenSpiel_Arena / utils /llm_utils.py

lcipolina

Upload 2 files

2f86234 verified 4 months ago

raw

history blame contribute delete

1.99 kB

	# utils/llm_utils.py
	"""Utility functions for Large Language Model (LLM) integration.

	This module provides helper functions to generate prompts and interact with LLMs
	for decision-making in game simulations.
	"""

	from functools import lru_cache
	from typing import List, Any
	import random

	def generate_prompt(game_name: str, state: str, legal_actions: List[int]) -> str:
	"""Generate a natural language prompt for the LLM to decide the next move.

	Args:
	game_name: The name of the game.
	state: The current game state as a string.
	legal_actions: The list of legal actions available to the player.

	Returns:
	str: A prompt string for the LLM.
	"""
	prompt = (
	f"You are playing the Game: {game_name}\n"
	f"State:\n{state}\n"
	f"Legal actions: {legal_actions}\n"
	"Your task is to choose the next action (provide the action number answer with only the number of your next move from the list of legal actions. Do not provide any additional text or explanation."
	)
	return prompt


	@lru_cache(maxsize=128)
	def llm_decide_move(llm: Any, prompt: str, legal_actions: tuple) -> int:
	"""Use an LLM to decide the next move, with caching for repeated prompts.

	Args:
	llm: The LLM pipeline instance (e.g., from Hugging Face).
	prompt: The prompt string provided to the LLM.
	legal_actions: The list of legal actions available (converted to tuple).

	Returns:
	int: The action selected by the LLM.
	"""

	# TODO(lkun): test this: temperature = 0.1 #less creative

	response = llm(prompt, max_new_tokens=30, pad_token_id=50256)[0]["generated_text"]
	for word in response.split():
	try:
	move = int(word)
	if move in legal_actions: # Validate the move against legal actions
	return move
	except ValueError:
	continue

	return random.choice(legal_actions) # Fallback if no valid move is found