Merge branch 'merge-main' of https://github.com/icwhite/mindcraft into merge-main

2025-06-08 10:15:55 +02:00 · 2025-05-03 15:06:29 -07:00 · 2025-05-03 15:06:29 -07:00 · bafef3bff2
commit bafef3bff2
parent 29b946b8be e4eb595a8b
1 changed files with 495 additions and 0 deletions
--- a/tasks/cooking_tasks/hells_kitchen_tasks.py
+++ b/tasks/cooking_tasks/hells_kitchen_tasks.py
@ -0,0 +1,495 @@
+import random
+import json
+from typing import Dict, List, Any, Tuple, Set
+from collections import Counter, defaultdict
+
+# Define your COOKING_ITEMS dictionary here
+# This is where you should put your complete COOKING_ITEMS dictionary
+COOKING_ITEMS = {
+# Cooked Meats
+"cooked_mutton": {
+    "recipe": [
+        "Step 1: Kill a sheep and pick up 1 mutton that is dropped.", 
+        "Step 2: Go to furnace and use it to cook the mutton."
+    ],
+    "description": "Cooked mutton meat",
+    "complexity": "easy"
+},
+"cooked_beef": {
+    "recipe": [
+        "Step 1: Kill a cow and pick up 1 beef that is dropped.",
+        "Step 2: Go to furnace and use it to cook the beef."
+    ],
+    "description": "Cooked beef meat",
+    "complexity": "easy"
+},
+"cooked_porkchop": {
+    "recipe": [
+        "Step 1: Kill a pig and pick up 1 porkchop that is dropped.",
+        "Step 2: Go to furnace and use it to cook the porkchop."
+    ],
+    "description": "Cooked porkchop",
+    "complexity": "easy"
+},
+"cooked_chicken": {
+    "recipe": [
+        "Step 1: Kill a chicken and pick up 1 raw chicken that is dropped.",
+        "Step 2: Go to furnace and use it to cook the raw chicken."
+    ],
+    "description": "Cooked chicken meat",
+    "complexity": "easy"
+},
+"cooked_rabbit": {
+    "recipe": [
+        "Step 1: Kill a rabbit and pick up 1 raw rabbit that is dropped.",
+        "Step 2: Go to furnace and use it to cook the raw rabbit."
+    ],
+    "description": "Cooked rabbit meat",
+    "complexity": "easy"
+},
+
+# Soups and Stews
+"beetroot_soup": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 6 beetroot.",
+        "Step 2: Go to the chest and grab a bowl.",
+        "Step 3: Go to the crafting table and combine the 6 beetroot and 1 bowl to make beetroot soup."
+    ],
+    "description": "A hearty beetroot soup",
+    "complexity": "medium"
+},
+"mushroom_stew": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 red mushroom and 1 brown mushroom.",
+        "Step 2: Go to the chest and grab a bowl.",
+        "Step 3: Go to the crafting table and combine both the mushrooms and bowl to make mushroom stew."
+    ],
+    "description": "A warm mushroom stew",
+    "complexity": "medium"
+},
+"rabbit_stew": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 carrot, 1 potato, and 1 brown mushroom (search for 'potatoes' (not 'potato').",
+        "Step 2: Go to the furnace and bake the potato.",
+        "Step 3: Go to the chest and grab a bowl",
+        "Step 5: Kill a rabbit and pick up 1 raw rabbit that is dropped.",
+        "Step 6: Go to the furnace and cook the raw rabbit.",
+        "Step 7: Go to the crafting table and combine the cooked rabbit, baked potato, carrot, brown mushroom, and bowl to make rabbit stew."
+    ],
+    "description": "A hearty rabbit stew",
+    "complexity": "hard"
+},
+"suspicious_stew": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 red mushroom, 1 brown mushroom.",
+        "Step 2: Go to the chest and grab a bowl and 1 dandelion",
+        "Step 4: Go to the crafting table and combine the mushrooms, dandelion, and bowl to make suspicious stew."
+    ],
+    "description": "A mysterious stew with special effects",
+    "complexity": "medium"
+},
+
+# Baked Goods
+"baked_potato": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 potato (search for 'potatoes' (not 'potato')).",
+        "Step 2: Go to the furnace and bake the potato."
+    ],
+    "description": "A simple baked potato",
+    "complexity": "easy"
+},
+"bread": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 3 wheat.",
+        "Step 2: Go to the crafting table and use the wheat to craft bread."
+    ],
+    "description": "Fresh bread",
+    "complexity": "medium"
+},
+"cake": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 3 wheat, 2 sugar cane.",
+        "Step 2: Go to the chest and grab 3 milk buckets (already filled with milk).",
+        "Step 3: Go to the chest and grab an egg.",
+        "Step 4: Go to the crafting table and craft the sugarcane into sugar.",
+        "Step 5: Go to the crafting table and combine all ingredients (3 wheat, 2 sugar, 1 egg, and milk bucket) to make a cake."
+    ],
+    "description": "A delicious cake",
+    "complexity": "hard"
+},
+"cookie": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 2 wheat.",
+        "Step 2: Go to the chest and grab 1 cocoa bean.",
+        "Step 3: Go to the crafting table and combine the wheat and cocoa bean to craft a cookie."
+    ],
+    "description": "Sweet cookies",
+    "complexity": "medium"
+},
+"pumpkin_pie": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 pumpkin and 1 sugar cane.",
+        "Step 2: Go to the chest and grab 1 egg.",
+        "Step 3: Go to the crafting table and craft the sugar cane into sugar.",
+        "Step 4: Go to the crafting table and combine the pumpkin, egg, and sugar to make a pumpkin pie."
+    ],
+    "description": "Delicious pumpkin pie",
+    "complexity": "hard"
+},
+
+# Sweet Foods
+"golden_apple": {
+    "recipe": [
+        "Step 1: Go to the chest and collect 1 apple and 8 gold ingots.",
+        "Step 2: Go to the crafting table and surround the apple with the gold ingots to create a golden apple."
+    ],
+    "description": "A magical golden apple",
+    "complexity": "hard"
+},
+
+# Special Foods
+"golden_carrot": {
+    "recipe": [
+        "Step 1: Go to the farm and collect 1 carrot.",
+        "Step 2: Go to the chest and collect gold ingots and convert them to gold nuggets.",
+        "Step 3: Go to the crafting table and surround the carrot with gold nuggets to create a golden carrot."
+    ],
+    "description": "A magical golden carrot",
+    "complexity": "hard"
+},
+
+}
+
+def generate_task_id(task: Dict[str, Any]) -> str:
+    """
+    Generate a standardized task ID based on target items and blocked access.
+    
+    Format: multiagent_cooking_{quantities}_{blocked_info}
+    Examples:
+    - multiagent_cooking_1_cooked_rabbit
+    - multiagent_cooking_1_cooked_rabbit_blocked_access_0
+    - multiagent_cooking_1_cake_1_cookie_blocked_access_0_1
+    
+    Args:
+        task: Task dictionary with target and blocked_access_to_recipe information
+    
+    Returns:
+        Standardized task ID string
+    """
+    # Generate the quantities part (e.g., "1_cake_1_cookie")
+    quantities = []
+    for item, count in sorted(task["target"].items()):
+        quantities.append(f"{count}_{item}")
+    
+    quantities_str = "_".join(quantities)
+    
+    # Generate the blocked access part if any (e.g., "blocked_access_0_1")
+    blocked_str = ""
+    if task["blocked_access_to_recipe"]:
+        # Sort to ensure consistent ordering
+        sorted_blocked = sorted(task["blocked_access_to_recipe"])
+        blocked_str = f"_blocked_access_{'_'.join(sorted_blocked)}"
+    
+    # Combine everything
+    return f"multiagent_cooking_{quantities_str}{blocked_str}"
+
+def generate_hells_kitchen_task_id(task: Dict[str, Any]) -> str:
+    """
+    Generate a standardized task ID for Hell's Kitchen tasks.
+
+    Format: multiagent_cooking_{quantities}_hells_kitchen
+    Examples:
+    - multiagent_cooking_cooked_mutton_cooked_beef_hells_kitchen
+
+    Args:
+        task: Task dictionary with target information
+
+    Returns:
+        Standardized task ID string
+    """
+    # Generate the quantities part (e.g., "cooked_mutton_cooked_beef")
+    quantities = "_".join(task["target"])
+
+    # Combine everything with hells_kitchen suffix
+    return f"multiagent_cooking_{quantities}_hells_kitchen"
+
+def generate_hells_kitchen_task() -> Dict[str, Any]:
+    """Generate a single Hell's Kitchen task where agents have recipes for each other's items."""
+    # Select two different items
+    selected_items = random.sample(list(COOKING_ITEMS.keys()), 2)
+
+    # Assign one item to each agent
+    agent0_target = selected_items[0]
+    agent1_target = selected_items[1]
+
+    # Combined target for the overall task as a list
+    combined_target = [agent0_target, agent1_target]
+
+    # Get recipes for both items
+    recipes = {}
+    for item in selected_items:
+        recipes[item] = COOKING_ITEMS[item]["recipe"]
+
+    # Create different goal strings for each agent
+    goals = {}
+
+    # Agent 0 has the recipe for Agent 1's target item
+    recipe_for_agent1 = "\n".join(recipes[selected_items[1]])
+    goals["0"] = (
+        f"You need to make {selected_items[0]}, but you don't have the recipe for it, your partner has it!\n\n"
+        f"Your partner needs to make {selected_items[1]}. You have their recipe:\n"
+        f"Recipe for {selected_items[1]}:\n{recipe_for_agent1}\n\n"
+        f"You must communicate effectively to exchange recipe information and complete both dishes."
+        f" Note: You can only guide your partner with recipe steps. You cannot help with ingredient collection or cooking."
+    )
+
+    # Agent 1 has the recipe for Agent 0's target item
+    recipe_for_agent0 = "\n".join(recipes[selected_items[0]])
+    goals["1"] = (
+        f"You need to make {selected_items[1]}, but you don't have the recipe for it, your partner has it!\n\n"
+        f"Your partner needs to make {selected_items[0]}. You have their recipe:\n"
+        f"Recipe for {selected_items[0]}:\n{recipe_for_agent0}\n\n"
+        f"You must communicate effectively to exchange recipe information and complete both dishes."
+        f" Note: You can only guide your partner with recipe steps. You cannot help with ingredient collection or cooking."
+    )
+
+    # Create a Hell's Kitchen themed conversation starter
+    conversation = (
+        f"We need to make {selected_items[0]} and {selected_items[1]} together. You are supposed to make {selected_items[1]} and I am supposed to make {selected_items[0]}, "
+        f"but I only have YOUR recipe and you only have access to MY recipe! Let's exchange information and get cooking!"
+    )
+
+    task_data = {
+        "conversation": conversation,
+        "agent_count": 2,
+        "target": combined_target,
+        "type": "cooking",
+        "timeout": 300,
+        "recipes": recipes,
+        "blocked_access_to_recipe": [],  # No blocked access - it's just switched
+        "goal": goals,
+        "task_type": "cooking"  # Mark as Hell's Kitchen task
+    }
+
+    # Generate a Hell's Kitchen task ID
+    task_id = generate_hells_kitchen_task_id(task_data)
+
+    return {task_id: task_data}
+
+def calculate_hells_kitchen_task_difficulty_metrics(task: Dict) -> Dict[str, Any]:
+    """Calculate detailed difficulty metrics for a Hell's Kitchen task."""
+    # Get all recipes
+    recipes = task["recipes"]
+    
+    # Calculate recipe step metrics
+    total_steps = sum(len(steps) for steps in recipes.values())
+    max_steps_per_recipe = max(len(steps) for steps in recipes.values()) if recipes else 0
+    
+    # Get number of target items
+    num_unique_items = len(task["target"])
+    
+    # Calculate overall difficulty score
+    difficulty_score = 0
+    
+    # Add score based on total steps
+    if total_steps <= 4:
+        step_difficulty = 1  # Easy
+    elif total_steps <= 8:
+        step_difficulty = 2  # Medium
+    else:
+        step_difficulty = 3  # Hard
+    
+    difficulty_score += step_difficulty
+    
+    # Add score based on number of items
+    item_difficulty = num_unique_items
+    difficulty_score += item_difficulty
+    
+    # Hell's Kitchen tasks are inherently more difficult due to communication requirements
+    # Add a communication difficulty factor
+    difficulty_score += 1
+    
+    # Determine final difficulty category
+    if difficulty_score <= 3:
+        difficulty_category = "easy"
+    elif difficulty_score <= 5:
+        difficulty_category = "medium"
+    else:
+        difficulty_category = "hard"
+    
+    # Compile all metrics into a dictionary
+    difficulty_metrics = {
+        "total_recipe_steps": total_steps,
+        "max_steps_per_recipe": max_steps_per_recipe,
+        "unique_target_items": num_unique_items,
+        "overall_difficulty_score": difficulty_score,
+        "difficulty_category": difficulty_category
+    }
+    
+    return difficulty_metrics
+
+def generate_maximum_hells_kitchen_tasks(
+    num_train_tasks: int,
+    num_test_tasks: int
+) -> Tuple[Dict[str, Dict], Dict[str, Dict]]:
+    """
+    Generate as many Hell's Kitchen tasks as specified, without balancing difficulty.
+    
+    Args:
+        num_train_tasks: Exact number of training tasks to generate
+        num_test_tasks: Exact number of test tasks to generate
+        
+    Returns:
+        Tuple of (train_tasks, test_tasks)
+    """
+    # Get all available cooking items
+    all_items = list(COOKING_ITEMS.keys())
+    
+    # Fixed test items as specified in your original code
+    hk_test_items = {"cooked_mutton", "baked_potato", "cake", "golden_carrot", "mushroom_stew", "bread"}
+    hk_train_items = set(all_items) - hk_test_items
+    
+    # Set fixed seed for consistent results
+    random.seed(42)
+    
+    # Generate tasks for training set
+    train_tasks = {}
+    while len(train_tasks) < num_train_tasks:
+        task = generate_hells_kitchen_task()
+        task_id, task_data = list(task.items())[0]
+        
+        # Check if task uses valid items for train set
+        task_items = set(task_data["target"])
+        if task_items.issubset(hk_train_items):
+            # Still calculate metrics for information but don't filter by them
+            task_data["difficulty_metrics"] = calculate_hells_kitchen_task_difficulty_metrics(task_data)
+            task_data["difficulty"] = task_data["difficulty_metrics"]["difficulty_category"]
+            train_tasks[task_id] = task_data
+    
+    # Generate tasks for test set
+    test_tasks = {}
+    while len(test_tasks) < num_test_tasks:
+        task = generate_hells_kitchen_task()
+        task_id, task_data = list(task.items())[0]
+        
+        # Check if task uses valid items for test set
+        task_items = set(task_data["target"])
+        if task_items.issubset(hk_test_items):
+            # Still calculate metrics for information but don't filter by them
+            task_data["difficulty_metrics"] = calculate_hells_kitchen_task_difficulty_metrics(task_data)
+            task_data["difficulty"] = task_data["difficulty_metrics"]["difficulty_category"]
+            test_tasks[task_id] = task_data
+    
+    return train_tasks, test_tasks
+
+
+
+def analyze_task_split(train_tasks, test_tasks):
+    """Analyze and print statistics about the train/test split with detailed difficulty metrics."""
+    # Count total tasks
+    train_count = len(train_tasks)
+    test_count = len(test_tasks)
+    
+    # Count difficulty distribution by category
+    train_difficulty = Counter(task["difficulty"] for task in train_tasks.values())
+    test_difficulty = Counter(task["difficulty"] for task in test_tasks.values())
+    
+    # Analyze quantitative difficulty metrics
+    train_metrics = {
+        "total_recipe_steps": [],
+        "unique_target_items": [],
+        "overall_difficulty_score": []
+    }
+    
+    test_metrics = {
+        "total_recipe_steps": [],
+        "unique_target_items": [],
+        "overall_difficulty_score": []
+    }
+    
+    # Collect metrics from tasks
+    for task in train_tasks.values():
+        for metric in train_metrics:
+            if metric in task["difficulty_metrics"]:
+                train_metrics[metric].append(task["difficulty_metrics"][metric])
+    
+    for task in test_tasks.values():
+        for metric in test_metrics:
+            if metric in task["difficulty_metrics"]:
+                test_metrics[metric].append(task["difficulty_metrics"][metric])
+    
+    # Calculate statistics for each metric
+    train_stats = {}
+    test_stats = {}
+    
+    for metric in train_metrics:
+        values = train_metrics[metric]
+        if values:
+            train_stats[metric] = {
+                "min": min(values),
+                "max": max(values),
+                "mean": sum(values) / len(values),
+                "median": sorted(values)[len(values)//2]
+            }
+    
+    for metric in test_metrics:
+        values = test_metrics[metric]
+        if values:
+            test_stats[metric] = {
+                "min": min(values),
+                "max": max(values),
+                "mean": sum(values) / len(values),
+                "median": sorted(values)[len(values)//2]
+            }
+    
+    # Get items in each set
+    train_items = set()
+    test_items = set()
+    
+    for task in train_tasks.values():
+        train_items.update(task["target"])
+    
+    for task in test_tasks.values():
+        test_items.update(task["target"])
+    
+    # Check for item overlap
+    item_overlap = train_items.intersection(test_items)
+    
+    # Compile the results
+    result = {
+        "train_count": train_count,
+        "test_count": test_count,
+        "train_difficulty_categories": dict(train_difficulty),
+        "test_difficulty_categories": dict(test_difficulty),
+        "train_difficulty_metrics": train_stats,
+        "test_difficulty_metrics": test_stats,
+        "train_items": list(train_items),
+        "test_items": list(test_items),
+        "item_overlap": list(item_overlap),
+        "is_valid_items_split": len(item_overlap) == 0
+    }
+    
+    return result
+
+# Example usage
+if __name__ == "__main__":
+    hk_train_tasks, hk_test_tasks = generate_maximum_hells_kitchen_tasks(
+        num_train_tasks=90,
+        num_test_tasks=30
+    )
+    
+    # Save Hell's Kitchen tasks to separate files
+    with open("hells_kitchen_train_tasks.json", "w") as f:
+        json.dump(hk_train_tasks, f, indent=2)
+    
+    with open("hells_kitchen_test_tasks.json", "w") as f:
+        json.dump(hk_test_tasks, f, indent=2)
+    
+    # Print counts
+    print(f"Generated {len(hk_train_tasks)} training tasks")
+    print(f"Generated {len(hk_test_tasks)} test tasks")
+    
+    # You can still analyze the distribution if interested
+    hk_analysis = analyze_task_split(hk_train_tasks, hk_test_tasks)
+    print("\nHell's Kitchen Tasks Analysis:")
+    print(json.dumps(hk_analysis, indent=2))