lcipolina committed on
Commit
2f86234
·
verified ·
1 Parent(s): e933c26

Upload 2 files

Browse files
Files changed (2) hide show
  1. utils/common_utils.py +29 -0
  2. utils/llm_utils.py +56 -0
utils/common_utils.py ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # utils/common_utils.py
2
+ """Common utility functions for the OpenSpiel LLM Arena project.
3
+
4
+ This module provides shared utility functions for logging, configuration,
5
+ and other cross-cutting concerns.
6
+ """
7
+
8
+ import logging
9
+
10
def setup_logger(name: str) -> logging.Logger:
    """Create (or fetch) a named logger configured for console output.

    The function is idempotent: if the logger already has handlers
    attached, it is returned unchanged so repeated calls do not stack
    duplicate handlers.

    Args:
        name: The name of the logger.

    Returns:
        logging.Logger: Configured logger instance.
    """
    logger = logging.getLogger(name)
    if logger.handlers:
        # Already configured by a previous call — return as-is.
        return logger

    stream_handler = logging.StreamHandler()
    stream_handler.setFormatter(
        logging.Formatter("%(asctime)s - %(name)s - %(levelname)s - %(message)s")
    )
    logger.addHandler(stream_handler)
    logger.setLevel(logging.INFO)
    return logger
29
+
utils/llm_utils.py ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # utils/llm_utils.py
2
+ """Utility functions for Large Language Model (LLM) integration.
3
+
4
+ This module provides helper functions to generate prompts and interact with LLMs
5
+ for decision-making in game simulations.
6
+ """
7
+
8
+ from functools import lru_cache
9
+ from typing import List, Any
10
+ import random
11
+
12
def generate_prompt(game_name: str, state: str, legal_actions: List[int]) -> str:
    """Generate a natural language prompt for the LLM to decide the next move.

    Args:
        game_name: The name of the game.
        state: The current game state as a string.
        legal_actions: The list of legal actions available to the player.

    Returns:
        str: A prompt string for the LLM.
    """
    # The closing instruction was previously a garbled run-on sentence with an
    # unclosed parenthesis; it is rewritten as three clear sentences so the
    # model receives an unambiguous "answer with a number only" instruction.
    prompt = (
        f"You are playing the Game: {game_name}\n"
        f"State:\n{state}\n"
        f"Legal actions: {legal_actions}\n"
        "Your task is to choose the next action. Answer with only the number "
        "of your next move from the list of legal actions. Do not provide any "
        "additional text or explanation."
    )
    return prompt
30
+
31
+
32
@lru_cache(maxsize=128)
def _query_llm_for_move(llm: Any, prompt: str, legal_actions: tuple):
    """Query the LLM once and parse a legal move from its reply.

    Cached on (llm, prompt, legal_actions) so repeated identical prompts do
    not re-invoke the model. Only the deterministic query/parse step is
    cached here — the random fallback lives in the caller, so a one-time
    parse failure does not pin an arbitrary random move in the cache.

    Args:
        llm: The LLM pipeline instance (must be hashable to be cacheable).
        prompt: The prompt string provided to the LLM.
        legal_actions: Tuple of legal actions to validate against.

    Returns:
        int | None: The first legal move found in the response, or None if
        the response contains no parseable legal move.
    """
    # TODO(lkun): test this: temperature = 0.1  # less creative
    response = llm(prompt, max_new_tokens=30, pad_token_id=50256)[0]["generated_text"]
    for word in response.split():
        try:
            move = int(word)
        except ValueError:
            continue
        if move in legal_actions:  # Validate the move against legal actions
            return move
    return None


def llm_decide_move(llm: Any, prompt: str, legal_actions: tuple) -> int:
    """Use an LLM to decide the next move, with caching for repeated prompts.

    Args:
        llm: The LLM pipeline instance (e.g., from Hugging Face).
        prompt: The prompt string provided to the LLM.
        legal_actions: The tuple of legal actions available (must be a tuple
            so the underlying query can be cached).

    Returns:
        int: The action selected by the LLM, or a uniformly random legal
        action if the LLM response contained no valid move.
    """
    move = _query_llm_for_move(llm, prompt, legal_actions)
    if move is not None:
        return move
    # Fallback: the LLM produced no parseable legal move for this prompt.
    # Kept outside the cached helper so the choice is re-drawn each call.
    return random.choice(legal_actions)