diff --git a/amnesia_bench.py b/amnesia_bench.py index e106d73..0ce6aaf 100644 --- a/amnesia_bench.py +++ b/amnesia_bench.py @@ -1,18 +1,44 @@ #!/usr/bin/env python3 +# Author: Claude Sonnet 4.6 (Bubba) +# Date: 28-March-2026 +# PURPOSE: AmnesiaBench v2 — multi-model, multi-problem benchmark runner that binary-searches +# for the minimum context window (n_reliable) at which each LLM can solve competition-math +# problems at 60% success rate. Supports 10 problems × N models for overnight runs. +# Features: prediction phase, composite Scott scoring, --model / --model-name flags, +# --run-all-models mode reading models.json, per-model result namespacing, full scoring table. +# Supports llama.cpp (http://), Google Gemini (gemini://), OpenRouter (openrouter://), +# and Anthropic OAuth (anthropic://) backends via create_client(). +# ARC puzzle support: uses arc_evaluator for grid answer evaluation, arc_prompts for system prompts. +# Exponential backoff applied to all external API calls (429/503 retry with jitter). +# Integration points: run_prediction_phase() → run_problem() → binary_search() → run_trial(). +# SRP/DRY check: Pass — prediction phase, scoring, model iteration all isolated. No duplication +# of result I/O. calculate_scores() is the single scoring engine. run_all_models() delegates +# to run_problem() so the multi-model path is just a loop around the single-model path. +# with_exponential_backoff() is the single retry engine used by both LLMClient and GeminiClient. """ -AmnesiaBench — How much context does a model actually need? +AmnesiaBench v2 — How much context does a model actually need? Binary-searches (log scale) for the minimum context window at which an LLM -can solve competition-math problems at a 20% success rate. - -4 configurations: {TIR, No-TIR} x {Hard Cutoff, Compaction} -5 trials per window size. Full conversation traces saved. +can solve competition-math problems at a 60% success rate. 
Runs prediction +phase, computes composite Scott scores, supports multi-model overnight runs. +Supports both llama.cpp (http://) and Google Gemini (gemini://) backends. Usage: - # Start llama.cpp server first, then: - python3 amnesia_bench.py --problem ab507a9f - python3 amnesia_bench.py --all + # Single problem, single model (llama.cpp): + python3 amnesia_bench.py --problem ab507a9f --model http://localhost:8080 --model-name Qwen35B + + # All problems, single model: + python3 amnesia_bench.py --all --model http://localhost:8080 --model-name Qwen35B + + # All problems, Gemini: + python3 amnesia_bench.py --all --model gemini://gemini-2.0-flash-lite --api-key $GEMINI_API_KEY + + # All problems, all models from models.json: + python3 amnesia_bench.py --all --run-all-models + + # Analysis: python3 amnesia_bench.py --analyze + python3 amnesia_bench.py --scores """ import argparse @@ -22,6 +48,7 @@ import json import math import os +import random import re import signal import sys @@ -31,25 +58,58 @@ from dataclasses import dataclass, field, asdict from datetime import datetime, timezone from pathlib import Path -from typing import Optional +from typing import Optional, Union import requests +from arc.arc_evaluator import evaluate_arc_answer +from arc.arc_prompts import ARC_SYSTEM_PROMPT + # ─── Defaults ──────────────────────────────────────────────────────────────── SERVER_URL = "http://localhost:8080" -MIN_WINDOW = 512 +MIN_WINDOW = 1 MAX_WINDOW = 32768 -TRIALS_PER_WINDOW = 5 -SUCCESS_THRESHOLD = 0.2 # 1/5 = 20% -CONVERGENCE_RATIO = 1.05 # stop when hi/lo < 5% -MAX_COMPACTIONS = 5 -COMPACTION_TRIGGER = 0.70 # compact at 70% of budget -MAX_TURNS = 40 # safety: max conversation turns -CODE_TIMEOUT = 30 # seconds per code execution +TRIALS_PER_WINDOW = 1 +SUCCESS_THRESHOLD = 0.6 # 60% +CONVERGENCE_RATIO = 1.05 # stop when hi/lo < 5% (fallback) +CONVERGENCE_ABS = 50 # stop when hi - lo < 50 tokens (primary) +MAX_COMPLETION_TOKENS = 16384 # hard cap per generation turn 
# ─── Model Context Window Registry ───────────────────────────────────────────

# Known context-window sizes keyed by model name.
MODEL_CONTEXT_WINDOWS = {
    "claude-sonnet-4.6": 200000,
    "deepseek-v3.2": 65536,
    "gemini-2.5-flash-lite": 1048576,
    "gemini-3.1-flash-lite-preview": 1048576,
    "gemini-3.1-pro-preview": 1048576,
    "mistral-small-2603": 32768,
    "openai/gpt-oss-20b": 128000,
    "qwen/qwen3.6-plus-preview": 131072,
    "glm-4.6v-flash": 128000,
}
DEFAULT_CONTEXT_WINDOW = 32768  # fallback if model not in mapping


def get_model_context_window(model_name: str) -> int:
    """Look up the registered context window for ``model_name``.

    Names that are not keys of MODEL_CONTEXT_WINDOWS resolve to
    DEFAULT_CONTEXT_WINDOW. The lookup is an exact, case-sensitive match.
    """
    try:
        return MODEL_CONTEXT_WINDOWS[model_name]
    except KeyError:
        return DEFAULT_CONTEXT_WINDOW
# ─── Exponential Backoff ─────────────────────────────────────────────────────

def _retry_delay(response, attempt, base_delay, max_delay):
    """Choose the pause before the next attempt, always within [0, max_delay]."""
    hinted = (
        response.headers.get("Retry-After")
        or response.headers.get("x-ratelimit-reset-requests")
    )
    if hinted:
        try:
            seconds = float(hinted)
        except ValueError:
            # Non-numeric hint (e.g. an HTTP-date) — fall back to computed backoff.
            seconds = None
        if seconds is not None and math.isfinite(seconds):
            # Clamp: a hint that is negative, or far larger than max_delay
            # (presumably possible if a server reports an absolute timestamp —
            # TODO confirm per provider), must neither crash time.sleep() nor
            # stall the run.
            return min(max(seconds, 0.0), max_delay)
    return min(base_delay * (2 ** attempt) + random.uniform(0, 2), max_delay)


def with_exponential_backoff(fn, max_retries=20, base_delay=2.0, max_delay=120.0):
    """Call ``fn()`` and retry it with exponential backoff on HTTP 429/503.

    Args:
        fn: Zero-argument callable that performs one request and raises
            ``requests.HTTPError`` on an error status.
        max_retries: Total number of attempts (the first call included).
            Values below 1 are treated as 1 so ``fn`` always runs once.
        base_delay: Base of the computed delay, in seconds.
        max_delay: Upper bound, in seconds, for any single sleep — applied to
            both the computed delay and a server-provided numeric hint.

    Returns:
        Whatever ``fn()`` returns on the first successful attempt.

    Raises:
        requests.HTTPError: For any status other than 429/503, for an error
            that carries no response, or when the last attempt still fails.
        Exception: Any other exception raised by ``fn`` propagates unchanged.

    The computed delay is ``min(base_delay * 2**attempt + uniform(0, 2),
    max_delay)``. A numeric ``Retry-After`` (or ``x-ratelimit-reset-requests``)
    header takes precedence, clamped to ``[0, max_delay]``.
    """
    attempts = max(1, max_retries)
    for attempt in range(attempts):
        try:
            return fn()
        except requests.HTTPError as e:
            response = e.response
            # Compare with None explicitly: a requests.Response is falsy for
            # 4xx/5xx statuses, so a plain truthiness test would skip retries.
            status = response.status_code if response is not None else None
            if status not in (429, 503) or attempt >= attempts - 1:
                raise
            delay = _retry_delay(response, attempt, base_delay, max_delay)
            print(f" [backoff] {status} — retrying in {delay:.1f}s (attempt {attempt+1}/{max_retries})")
            time.sleep(delay)
def generate(self, messages: list[dict], max_tokens: int) -> dict:
    """Stream one chat completion and return its text plus token usage.

    Posts to ``{server_url}/v1/chat/completions`` with ``stream=True``,
    accumulates the ``data:`` chunks, and echoes every reasoning/content
    piece to stdout as it arrives. The HTTP request itself is retried through
    with_exponential_backoff() on 429/503.

    Args:
        messages: OpenAI-style chat messages (list of role/content dicts).
        max_tokens: Completion cap for this turn; values below 1 become 1.

    Returns:
        dict with keys ``content`` (reasoning followed by answer),
        ``reasoning_content``, ``final_content``, ``prompt_tokens``,
        ``completion_tokens``, ``total_tokens`` and ``finish_reason``
        (``"unknown"`` if the stream never reported one). Token counts stay 0
        when the server sends no ``usage`` object in any chunk.

    Raises:
        requests.HTTPError: Non-retriable HTTP error, or retries exhausted.
    """
    max_tokens = max(1, max_tokens)
    payload = {
        "messages": messages,
        "max_tokens": max_tokens,
        "temperature": self.temperature,
        "stream": True,
    }
    # Build the request once, outside the retry closure, so retries resend
    # exactly the same payload and headers.
    if self.model_name:
        payload["model"] = self.model_name
    headers = dict(self.auth_header)
    # Enable prompt caching for OpenRouter (reduces cost + latency on repeated prompts)
    if "openrouter.ai" in self.server_url:
        headers["X-OpenRouter-Cache"] = "true"

    def _do_request():
        resp = requests.post(
            f"{self.server_url}/v1/chat/completions",
            headers=headers,
            json=payload,
            timeout=3600,
            stream=True,
        )
        try:
            resp.raise_for_status()
        except requests.HTTPError:
            # Release the pooled connection before the backoff sleeps; status
            # and headers stay readable on the closed response.
            resp.close()
            raise
        return resp

    resp = with_exponential_backoff(_do_request)
    reasoning_parts = []
    content_parts = []
    prompt_tokens = 0
    completion_tokens = 0
    total_tokens = 0
    finish_reason = "unknown"

    print(" [stream] ", end="", flush=True)
    try:
        for line in resp.iter_lines():
            if not line:
                continue
            line = line.decode("utf-8") if isinstance(line, bytes) else line
            if line.startswith("data: "):
                line = line[6:]
            if line == "[DONE]":
                break
            try:
                chunk = json.loads(line)
            except json.JSONDecodeError:
                # Keep-alive comments and other non-JSON lines are skipped.
                continue
            if not isinstance(chunk, dict):
                continue
            # A chunk may carry an empty "choices" list (e.g. a usage-only
            # chunk); indexing [0] on it would raise IndexError.
            choices = chunk.get("choices") or [{}]
            choice = choices[0] or {}
            delta = choice.get("delta") or {}
            r_piece = delta.get("reasoning_content", "") or delta.get("reasoning", "") or ""
            c_piece = delta.get("content", "") or ""
            if r_piece:
                reasoning_parts.append(r_piece)
                sys.stdout.write(r_piece)
                sys.stdout.flush()
            if c_piece:
                content_parts.append(c_piece)
                sys.stdout.write(c_piece)
                sys.stdout.flush()
            finish_reason = choice.get("finish_reason") or finish_reason
            usage = chunk.get("usage") or {}
            if usage:
                prompt_tokens = usage.get("prompt_tokens", prompt_tokens)
                completion_tokens = usage.get("completion_tokens", completion_tokens)
                total_tokens = usage.get("total_tokens", total_tokens)
    finally:
        # Always hand the streamed connection back, including after the early
        # break on [DONE] or an exception mid-stream.
        resp.close()
    print()

    reasoning = "".join(reasoning_parts)
    content = "".join(content_parts)
    # NOTE(review): in this view the reasoning wrapper is plain newlines; if
    # the real file wraps reasoning in delimiter tags, keep those — confirm.
    if reasoning:
        full_content = f"\n{reasoning}\n\n{content}"
    else:
        full_content = content

    return {
        "content": full_content,
        "reasoning_content": reasoning,
        "final_content": content,
        "prompt_tokens": prompt_tokens,
        "completion_tokens": completion_tokens,
        "total_tokens": total_tokens,
        "finish_reason": finish_reason,
    }
skip /health check — just assume reachable + if "openrouter.ai" in self.server_url or "localhost" not in self.server_url and not self.server_url.startswith("http://192."): + return True try: r = requests.get(f"{self.server_url}/health", timeout=5) return r.status_code == 200 @@ -188,16 +344,309 @@ def ping(self) -> bool: return False +# ─── Gemini Client ─────────────────────────────────────────────────────────── + +class GeminiClient: + """Client for Google Gemini API (gemini-2.0-flash-lite or similar). + + Accepts OpenAI-style message lists and converts them to Gemini's + generateContent format. Returns the same dict shape as LLMClient.generate() + so the rest of the benchmark code is backend-agnostic. + """ + + def __init__( + self, + api_key: str, + model: str = "gemini-2.0-flash-lite", + temperature: float = TEMPERATURE, + ): + self.api_key = api_key + self.model = model + self.temperature = temperature + self.base_url = "https://generativelanguage.googleapis.com/v1beta" + + def _convert_messages(self, messages: list[dict]) -> tuple[Optional[dict], list[dict]]: + """Convert OpenAI-style messages to Gemini format. + + Returns (system_instruction, contents) where: + - system_instruction is None or {"parts": [{"text": "..."}]} + - contents is a list of {"role": "user"|"model", "parts": [{"text": "..."}]} + """ + system_instruction = None + contents = [] + + for msg in messages: + role = msg.get("role", "user") + text = msg.get("content", "") + + if role == "system": + system_instruction = {"parts": [{"text": text}]} + elif role == "assistant": + contents.append({"role": "model", "parts": [{"text": text}]}) + else: + contents.append({"role": "user", "parts": [{"text": text}]}) + + return system_instruction, contents + + def generate(self, messages: list[dict], max_tokens: int) -> dict: + """ + Send messages to Gemini generateContent endpoint. + Returns same dict format as LLMClient: content, prompt_tokens, + completion_tokens, total_tokens, finish_reason. 
+ Uses exponential backoff on 429/503 errors. + """ + max_tokens = max(1, max_tokens) + system_instruction, contents = self._convert_messages(messages) + + payload = { + "contents": contents, + "generationConfig": { + "maxOutputTokens": max_tokens, + "temperature": self.temperature, + }, + } + if system_instruction is not None: + payload["systemInstruction"] = system_instruction + + url = ( + f"{self.base_url}/models/{self.model}:generateContent" + f"?key={self.api_key}" + ) + + def _do_request(): + resp = requests.post(url, json=payload, timeout=3600) + resp.raise_for_status() + return resp + + resp = with_exponential_backoff(_do_request) + data = resp.json() + + # Parse response + candidates = data.get("candidates", []) + if candidates: + candidate = candidates[0] + parts = candidate.get("content", {}).get("parts", []) + content = "".join(p.get("text", "") for p in parts) + finish_reason_raw = candidate.get("finishReason", "STOP") + # Normalise Gemini finish reasons to llama.cpp style + finish_reason_map = { + "STOP": "stop", + "MAX_TOKENS": "length", + "SAFETY": "stop", + "RECITATION": "stop", + "OTHER": "stop", + } + finish_reason = finish_reason_map.get(finish_reason_raw, "stop") + else: + content = "" + finish_reason = "stop" + + usage = data.get("usageMetadata", {}) + prompt_tokens = usage.get("promptTokenCount", 0) + completion_tokens = usage.get("candidatesTokenCount", 0) + total_tokens = usage.get("totalTokenCount", prompt_tokens + completion_tokens) + + # Print a brief stream-alike indicator for consistency + print(f" [gemini] {completion_tokens} tokens | finish={finish_reason}") + print(content[:120].replace("\n", " ") + ("..." 
# ─── Anthropic OAuth Client ──────────────────────────────────────────────────

class AnthropicOAuthClient:
    """Anthropic Messages API client authenticated with an OAuth token.

    The token (sk-ant-oat prefix) is read from the ANTHROPIC_OAUTHTOKEN
    environment variable and sent as a Bearer token together with the
    ``anthropic-beta`` header. Every request uses FIXED_SYSTEM as its system
    prompt; ``system`` messages supplied by the caller are dropped, so
    ARC/AIMO strategies have to travel in the user message. No temperature is
    ever sent (omitted entirely — 0.0 gets rejected).
    """

    FIXED_SYSTEM = "You are Claude Code, Anthropic's official CLI for Claude."

    def __init__(self, model: str = "claude-sonnet-4-6"):
        """Store the model id and load the OAuth token from the environment.

        Raises:
            ValueError: If ANTHROPIC_OAUTHTOKEN is unset or empty.
        """
        self.model = model
        self.token = os.environ.get("ANTHROPIC_OAUTHTOKEN")
        if not self.token:
            raise ValueError(
                "AnthropicOAuthClient requires ANTHROPIC_OAUTHTOKEN env var (sk-ant-oat prefix)."
            )
        self.base_url = "https://api.anthropic.com/v1/messages"

    def generate(self, messages: list[dict], max_tokens: int) -> dict:
        """Run one non-streaming completion; returns the LLMClient-shaped dict.

        ``system`` messages are skipped, ``assistant`` messages keep their
        role, and every other role is sent as ``user``. The request goes
        through with_exponential_backoff().
        """
        max_tokens = max(1, max_tokens)

        # The system prompt lives in the top-level 'system' field, never in
        # the messages array, so caller-provided system turns are filtered out.
        # NOTE(review): their text is discarded, not merged into a user turn —
        # confirm callers already put their instructions in the user message.
        anthropic_messages = [
            {
                "role": "assistant" if m.get("role", "user") == "assistant" else "user",
                "content": m.get("content", ""),
            }
            for m in messages
            if m.get("role", "user") != "system"
        ]

        request_body = {
            "model": self.model,
            "max_tokens": max_tokens,
            "system": self.FIXED_SYSTEM,
            "messages": anthropic_messages,
            # NOTE: temperature intentionally omitted — 0.0 gets rejected by Anthropic
        }
        request_headers = {
            "Authorization": f"Bearer {self.token}",
            "anthropic-version": "2023-06-01",
            "anthropic-beta": "oauth-2025-04-20",
            "content-type": "application/json",
        }

        def _post():
            reply = requests.post(
                self.base_url,
                headers=request_headers,
                json=request_body,
                timeout=3600,
            )
            reply.raise_for_status()
            return reply

        data = with_exponential_backoff(_post).json()

        # Concatenate the text of every "text" block; other block types are ignored.
        content = "".join(
            block.get("text", "")
            for block in data.get("content", [])
            if block.get("type") == "text"
        )

        usage = data.get("usage", {})
        prompt_tokens = usage.get("input_tokens", 0)
        completion_tokens = usage.get("output_tokens", 0)
        total_tokens = prompt_tokens + completion_tokens

        # Normalise Anthropic stop reasons to the llama.cpp-style values
        # used by the other clients; unknown reasons count as "stop".
        finish_reason = {
            "end_turn": "stop",
            "max_tokens": "length",
            "stop_sequence": "stop",
        }.get(data.get("stop_reason", "end_turn"), "stop")

        print(f" [anthropic] {completion_tokens} tokens | finish={finish_reason}")
        preview = content[:120].replace("\n", " ")
        print(preview + ("..." if len(content) > 120 else ""))

        return {
            "content": content,
            "reasoning_content": "",
            "final_content": content,
            "prompt_tokens": prompt_tokens,
            "completion_tokens": completion_tokens,
            "total_tokens": total_tokens,
            "finish_reason": finish_reason,
        }

    def ping(self) -> bool:
        """Health check: True when a tiny generation returns non-empty text."""
        try:
            reply = self.generate(
                messages=[{"role": "user", "content": "Say OK."}],
                max_tokens=10,
            )
        except Exception:
            return False
        return bool(reply.get("content"))
# ─── Parsing Helpers ─────────────────────────────────────────────────────────

def extract_python_blocks(text: str) -> list[str]:
    """Return the body of every ```python fenced block in ``text``, in order.

    A fence only counts when "```python" is followed by optional whitespace
    and a newline; the body runs up to the next "```" and keeps its trailing
    newline. Returns an empty list when nothing matches.
    """
    fenced = re.finditer(r"```python\s*\n(.*?)```", text, flags=re.DOTALL)
    return [hit.group(1) for hit in fenced]
Returns None if not found.""" match = re.search(r"(.*?)", text, re.DOTALL) if match: return match.group(1).strip() @@ -206,31 +655,26 @@ def extract_compact_call(text: str) -> Optional[str]: def extract_boxed_answer(text: str) -> Optional[int]: """Extract the last \\boxed{...} answer from text, ignoring blocks.""" - # Try outside blocks first non_think = re.sub(r".*?", "", text, flags=re.DOTALL) target = non_think if non_think.strip() else text matches = re.findall(r"\\boxed\{([^{}]+)\}", target) if not matches: - # Fallback: try nested braces matches = re.findall(r"\\boxed\{(.+?)\}", target) if not matches: return None raw = matches[-1].strip() - # Try direct int parse try: return int(raw) except ValueError: pass - # Try float -> int try: f = float(raw) if f == int(f): return int(f) except ValueError: pass - # Try simple eval (e.g. "2^10" or "3*5") try: cleaned = raw.replace("^", "**").replace(",", "") return int(eval(cleaned)) @@ -239,112 +683,457 @@ def extract_boxed_answer(text: str) -> Optional[int]: return None -# ─── Single Trial (one attempt at solving a problem) ───────────────────────── +# ─── Prediction Phase ──────────────────────────────────────────────────────── + +def run_prediction_phase( + client, + problem: dict, + max_tokens: int = 300, +) -> dict: + """ + Ask the model to predict its own performance before testing begins. + Returns parsed prediction dict with keys: success_prediction, n_reliable_prediction, + compaction_prompt, raw_response. Falls back to safe defaults on parse failure. 
+ """ + problem_text = problem.get("problem_text", "") + prompt = PREDICTION_PROMPT.format(problem_text=problem_text) + messages = [{"role": "user", "content": prompt}] + + print(f"\n [Prediction Phase] Asking model to predict performance...") + try: + resp = client.generate(messages, max_tokens=max_tokens) + except Exception as e: + print(f" [Prediction Phase] API error: {e} — using defaults") + return _prediction_defaults(raw_response=f"ERROR: {e}") + + raw = resp.get("content", "") + completion_tokens = resp.get("completion_tokens", 0) + + if completion_tokens > max_tokens: + print(f" [Prediction Phase] Response too long ({completion_tokens} > {max_tokens}) — using defaults") + return _prediction_defaults(raw_response=raw) + + success_match = re.search( + r"\s*(True|False)\s*", + raw, re.IGNORECASE + ) + if not success_match: + print(" [Prediction Phase] Missing tag — using defaults") + return _prediction_defaults(raw_response=raw) + success_prediction = success_match.group(1).strip().lower() == "true" + + n_reliable_match = re.search( + r"\s*(\d+)\s*", + raw + ) + if not n_reliable_match: + print(" [Prediction Phase] Missing tag — using defaults") + return _prediction_defaults(raw_response=raw) + n_reliable_prediction = int(n_reliable_match.group(1)) + + compaction_match = re.search( + r"(.*?)", + raw, re.DOTALL + ) + if not compaction_match: + print(" [Prediction Phase] Missing tag — using defaults") + return _prediction_defaults(raw_response=raw) + compaction_prompt = compaction_match.group(1).strip() or DEFAULT_COMPACTION_PROMPT + + print(f" [Prediction Phase] success={success_prediction}, n_reliable={n_reliable_prediction}, compaction='{compaction_prompt[:60]}'") + + return { + "success_prediction": success_prediction, + "n_reliable_prediction": n_reliable_prediction, + "compaction_prompt": compaction_prompt, + "raw_response": raw, + } + + +def _prediction_defaults(raw_response: str = "") -> dict: + """Return safe prediction defaults (n_reliable=None means 
# ─── Scoring Engine ──────────────────────────────────────────────────────────

def _load_problem_baseline(problems_dir: Path, pid: str) -> Optional[int]:
    """Read the fixed reference token count for one problem, or None if unavailable."""
    prob_file = problems_dir / f"{pid}.json"
    if not prob_file.exists():
        return None
    try:
        token_avg = json.loads(prob_file.read_text()).get("gptoss_120b_correct_token_avg")
        return None if token_avg is None else int(token_avg)
    except (OSError, ValueError, TypeError, AttributeError, OverflowError):
        # Unreadable or malformed problem file: treat as "no baseline".
        return None


def calculate_scores(
    results_dir: Optional[Path] = None,
    problems_dir: Optional[Path] = None,
) -> None:
    """Load all per-model result files and print the composite benchmark scores.

    Args:
        results_dir: Directory holding per-config result JSON files
            (``*_summary.json`` files are ignored). Defaults to RESULTS_DIR.
        problems_dir: Directory holding ``{problem_id}.json`` problem files.
            Defaults to PROBLEMS_DIR.

    Baseline:
        For each problem the baseline is the fixed value stored in its problem
        file under ``gptoss_120b_correct_token_avg`` (None when absent). The
        same value is the baseline for n_reliable and n_reliable_prediction.

    Per problem, using the config with the lowest ``minimum_window``:
        problem_score    = baseline / minimum_window
        prediction_score = baseline / n_reliable_prediction
        (0.0 whenever an operand is missing or non-positive)

    Per model:
        composite      = mean(problem_score) over solved problems
        pred_composite = mean(prediction_score) over solved problems
        coverage       = min(1, attempted / eligible), where eligible counts
                         every known problem that has a baseline
        accuracy       = solved / attempted
        pred_accuracy  = correct_success_predictions / total_problems
        final_score    = composite * pred_composite * coverage * accuracy
                         * pred_accuracy * 10000

    A success prediction counts as correct when the model predicted True and
    solved the problem, or predicted False on an unsolved problem that has no
    baseline. FLOPs are not tracked and do not enter the score.

    Prints a per-problem table and a per-model composite table; returns None.
    """
    results_dir = Path(RESULTS_DIR if results_dir is None else results_dir)
    problems_dir = Path(PROBLEMS_DIR if problems_dir is None else problems_dir)

    # ── Load all per-config result files (not summary files) ──
    # File naming: results/{model_name}_{problem_id}_{config}.json
    #          or legacy: results/{problem_id}_{config}.json (no model prefix)
    result_files = [
        f for f in sorted(results_dir.glob("*.json"))
        if not f.name.endswith("_summary.json")
    ]
    if not result_files:
        print("No result files found. Run experiments first.")
        return

    # Structure: {model_name: {problem_id: {config_name: result_dict}}}
    by_model: dict[str, dict[str, dict[str, dict]]] = {}

    for rf in result_files:
        try:
            data = json.loads(rf.read_text())
        except (OSError, ValueError) as e:
            print(f" [scores] Could not read {rf.name}: {e}")
            continue
        if not isinstance(data, dict):
            # Valid JSON that is not an object cannot be a result record.
            print(f" [scores] Skipping {rf.name}: not a JSON object")
            continue

        model_name = data.get("model_name") or data.get("model") or "unknown"
        pid = data.get("problem_id", rf.stem)
        config = data.get("config", {})
        config_name = config.get("name", "unknown") if isinstance(config, dict) else str(config)

        by_model.setdefault(model_name, {}).setdefault(pid, {})[config_name] = data

    if not by_model:
        print("No parseable result files found.")
        return

    all_problem_ids = sorted({pid for problems in by_model.values() for pid in problems})

    # ── Fixed baselines from the problem JSON files ──
    # A fixed baseline keeps scores stable and comparable across runs.
    baseline_n_reliable: dict[str, Optional[int]] = {
        pid: _load_problem_baseline(problems_dir, pid) for pid in all_problem_ids
    }
    baseline_n_pred: dict[str, Optional[int]] = dict(baseline_n_reliable)

    # ── Per-problem detail table ──
    print(f"\n{'='*110}")
    print(f" AmnesiaBench v2 — Per-Problem Detail")
    print(f"{'='*110}")
    print(f"{'Model':<25} {'Problem':<28} {'Config':<22} {'MinWin':>7} {'Baseline':>8} {'ProbScore':>10} {'N_Pred':>8} {'PredScore':>10}")
    print(f"{'-'*110}")

    # ── Per-model composite score computation ──
    model_scores = {}
    total_problems = len(all_problem_ids)

    for model_name in sorted(by_model.keys()):
        model_data = by_model[model_name]
        problem_scores = []
        prediction_scores = []
        problems_attempted = 0
        problems_solved = 0
        problems_eligible = 0
        correct_success_preds = 0

        for pid in all_problem_ids:
            baseline = baseline_n_reliable.get(pid)
            base_pred = baseline_n_pred.get(pid)

            # Eligibility is a property of the problem (a baseline exists),
            # so count it before skipping problems this model never ran;
            # otherwise attempted / eligible could never drop below 1.
            if baseline is not None:
                problems_eligible += 1

            if pid not in model_data:
                continue
            problems_attempted += 1

            # Use the best config for this problem (lowest minimum_window)
            configs_for_pid = model_data[pid]
            best_result = None
            best_mw = None
            for result in configs_for_pid.values():
                mw = result.get("minimum_window")
                if mw is not None and (best_mw is None or mw < best_mw):
                    best_mw = mw
                    best_result = result

            if best_result is None:
                # Model didn't solve this problem in any config.
                pred = next(iter(configs_for_pid.values())).get("prediction", {}) or {}
                if not pred.get("success_prediction", True) and baseline is None:
                    correct_success_preds += 1  # correctly predicted failure
                continue

            problems_solved += 1

            # Problem score (guard against a zero window in a damaged file).
            if baseline is not None and best_mw > 0:
                prob_score = baseline / best_mw
            else:
                prob_score = 0.0
            problem_scores.append(prob_score)

            # Prediction score
            pred = best_result.get("prediction", {}) or {}
            n_pred_val = pred.get("n_reliable_prediction")
            if pred.get("success_prediction", True):
                correct_success_preds += 1  # correctly predicted success (and solved)

            if n_pred_val is not None and base_pred is not None and n_pred_val > 0:
                pred_score = base_pred / n_pred_val
            else:
                pred_score = 0.0
            prediction_scores.append(pred_score)

            prob_score_str = f"{prob_score:.3f}"
            pred_score_str = f"{pred_score:.3f}" if n_pred_val is not None else "N/A"
            baseline_str = str(baseline) if baseline is not None else "N/A"
            n_pred_str = str(n_pred_val) if n_pred_val is not None else "inf"

            # Use config name from best result
            cfg = best_result.get("config", {})
            cfg_name = cfg.get("name", "unknown") if isinstance(cfg, dict) else str(cfg)

            print(
                f"{model_name:<25} {pid:<28} {cfg_name:<22} {str(best_mw):>7} "
                f"{baseline_str:>8} {prob_score_str:>10} {n_pred_str:>8} {pred_score_str:>10}"
            )

        # ── Composite scores ──
        composite = sum(problem_scores) / len(problem_scores) if problem_scores else 0.0
        pred_composite = sum(prediction_scores) / len(prediction_scores) if prediction_scores else 0.0
        # Coverage: fraction of eligible problems the model attempted. Capped
        # at 1.0 because attempts on problems without a baseline also count.
        coverage = min(1.0, problems_attempted / problems_eligible) if problems_eligible > 0 else 0.0
        accuracy = problems_solved / problems_attempted if problems_attempted > 0 else 0.0
        pred_accuracy = correct_success_preds / total_problems if total_problems > 0 else 0.0

        final_score = composite * pred_composite * coverage * accuracy * pred_accuracy * 10000

        model_scores[model_name] = {
            "composite": composite,
            "pred_composite": pred_composite,
            "coverage": coverage,
            "accuracy": accuracy,
            "pred_accuracy": pred_accuracy,
            "final_score": final_score,
            "problems_attempted": problems_attempted,
            "problems_solved": problems_solved,
            "problems_eligible": problems_eligible,
            "total_problems": total_problems,
        }

    # ── Per-model composite table ──
    print(f"\n{'='*100}")
    print(f" AmnesiaBench v2 — Composite Scores (Scott's Formula)")
    print(f" NOTE: FLOPs not tracked — omitted from scoring.")
    print(f"{'='*100}")
    print(f"{'Model':<25} {'Composite':>10} {'PredComp':>10} {'Coverage':>9} {'Accuracy':>9} {'PredAcc':>8} {'FinalScore':>12}")
    print(f"{'-'*100}")

    for model_name in sorted(model_scores.keys()):
        s = model_scores[model_name]
        print(
            f"{model_name:<25} "
            f"{s['composite']:>10.4f} "
            f"{s['pred_composite']:>10.4f} "
            f"{s['coverage']:>9.3f} "
            f"{s['accuracy']:>9.3f} "
            f"{s['pred_accuracy']:>8.3f} "
            f"{s['final_score']:>12.2f}"
        )
    print(f"{'='*100}")
    print(f"\nFormula: final_score = composite × pred_composite × coverage × accuracy × pred_accuracy × 10000")
    print(f" composite = mean(baseline_n_reliable / model_n_reliable) over solved problems")
    print(f" pred_composite = mean(baseline_n_pred / model_n_pred) over all problems")
    print(f" coverage = attempted / eligible (eligible: baseline exists for problem)")
    print(f" accuracy = solved / attempted")
    print(f" pred_accuracy = correct_success_predictions / total_problems\n")
completion_tokens (assistant only) - prompt_tokens: Optional[int] = None # prompt_tokens at this point - total_tokens: Optional[int] = None # total context at this point + tokens: Optional[int] = None + prompt_tokens: Optional[int] = None + total_tokens: Optional[int] = None finish_reason: Optional[str] = None - code_executed: Optional[str] = None # code that was run (if any) - code_output: Optional[str] = None # output from code (if any) - compact_summary: Optional[str] = None # summary extracted (if compact call) + code_executed: Optional[str] = None + code_output: Optional[str] = None + compact_summary: Optional[str] = None + forced_compact: bool = False @dataclass class TrialResult: - """Full result of one trial.""" problem_id: str - correct_answer: int + correct_answer: object # int for math, list for ARC token_limit: int tir: bool compaction: bool trial_idx: int success: bool - answer: Optional[int] - total_tokens_peak: int # peak total_tokens seen + answer: object # Optional[int] for math, str marker for ARC + total_tokens_peak: int n_turns: int n_compactions: int n_code_calls: int n_code_errors: int wall_time_s: float error: Optional[str] - finish_reason: str # "solved", "truncated", "budget_exceeded", "max_turns", "error" - conversation: list = field(default_factory=list) # list of Turn dicts + finish_reason: str + conversation: list = field(default_factory=list) def run_trial( - client: LLMClient, + client, problem_id: str, problem_text: str, - correct_answer: int, + correct_answer, token_limit: int, tir: bool, compaction: bool, trial_idx: int, + compaction_hint: str = "", + topic: str = "math", + system_prompt_override: str = None, ) -> TrialResult: - """Run one trial: try to solve the problem within the token budget.""" - t0 = time.time() sandbox = PythonSandbox() if tir else None - conversation: list[Turn] = [] # full trace - messages: list[dict] = [] # current API messages + conversation: list[Turn] = [] + messages: list[dict] = [] n_compactions = 0 
n_code_calls = 0 n_code_errors = 0 peak_tokens = 0 - last_content = "" error_msg = None finish = "max_turns" - # Select system prompt - if compaction: - sys_prompt = SYSTEM_COMPACT.format( - token_limit=token_limit, max_compactions=MAX_COMPACTIONS - ) + active_compaction_hint = compaction_hint.strip() if compaction_hint else DEFAULT_COMPACTION_PROMPT + + is_arc = (topic == "arc") + is_anthropic = isinstance(client, AnthropicOAuthClient) + + if is_arc: + if is_anthropic: + # Anthropic OAuth: fixed system prompt, ARC strategy in user message + sys_prompt = AnthropicOAuthClient.FIXED_SYSTEM + user_content = ARC_SYSTEM_PROMPT + "\n\n" + problem_text + else: + # All other providers: ARC system prompt, problem in user message + sys_prompt = ARC_SYSTEM_PROMPT + user_content = problem_text else: - sys_prompt = SYSTEM_HARD.format(token_limit=token_limit) + # AIMO3 math — existing behavior + if system_prompt_override is not None: + sys_prompt = system_prompt_override + elif compaction: + sys_prompt = SYSTEM_COMPACT.format( + token_limit=token_limit, max_compactions=MAX_COMPACTIONS + ) + else: + sys_prompt = SYSTEM_HARD.format(token_limit=token_limit) + user_content = problem_text messages = [ {"role": "system", "content": sys_prompt}, - {"role": "user", "content": problem_text}, + {"role": "user", "content": user_content}, ] conversation.append(Turn(role="system", content=sys_prompt)) - conversation.append(Turn(role="user", content=problem_text)) + conversation.append(Turn(role="user", content=user_content)) for turn_i in range(MAX_TURNS): - # Calculate remaining budget - # We estimate prompt_tokens from the last known total. - # On the first call, we don't know yet — use a generous max_tokens. 
if peak_tokens > 0: - estimated_prompt = peak_tokens # last total ≈ next prompt - remaining = token_limit - estimated_prompt + remaining = token_limit - peak_tokens else: - remaining = token_limit # first call, let API figure it out + remaining = token_limit if remaining <= 0: - if compaction: - finish = "budget_exceeded" - else: - finish = "truncated" + finish = "budget_exceeded" if compaction else "truncated" break - # Generate + # In Compact config, cap generation at 50% of token_limit so we can + # inject compaction right at the boundary (not after overshooting). + if compaction and peak_tokens < 0.5 * token_limit: + compact_ceiling = int(0.5 * token_limit) - peak_tokens + capped_tokens = min(remaining, MAX_COMPLETION_TOKENS, max(1, compact_ceiling)) + else: + capped_tokens = min(remaining, MAX_COMPLETION_TOKENS) try: - resp = client.generate(messages, max_tokens=remaining) + resp = client.generate(messages, max_tokens=capped_tokens) except Exception as e: error_msg = f"API error: {e}" finish = "error" break + if resp["finish_reason"] in ("length", "truncated"): + if is_arc: + from arc.arc_evaluator import extract_all_numbered_answers + if not extract_all_numbered_answers(resp["content"]): + finish = "truncated" + elif extract_boxed_answer(resp["content"]) is None: + finish = "truncated" + content = resp["content"] total_now = resp["total_tokens"] peak_tokens = max(peak_tokens, total_now) - last_content = content + + # Enforce budget BEFORE answer check — required for thinking models (e.g. Qwen3.6+) + # where reasoning tokens bypass max_tokens cap and total_now >> token_limit. + # Without this check, a thinking model can "solve" a problem using its full + # reasoning budget even when token_limit=288. 
+ if total_now >= token_limit: + finish = "budget_exceeded" if compaction else "truncated" + break turn = Turn( role="assistant", @@ -354,54 +1143,86 @@ def run_trial( total_tokens=total_now, finish_reason=resp["finish_reason"], ) - conversation.append(turn) - # ── Check for boxed answer FIRST (highest priority) ── - answer = extract_boxed_answer(content) - if answer is not None: - finish = "solved" - break + if is_arc: + arc_result = evaluate_arc_answer(content, correct_answer) + if arc_result["correct"]: + finish = "solved" + break + elif arc_result["num_answers_found"] > 0: + # Model provided answer tags but got it wrong + finish = "wrong_answer" + break + else: + answer = extract_boxed_answer(content) + if answer is not None: + finish = "solved" + break - # ── Check for compact call ── compact_summary = extract_compact_call(content) if compaction else None if compact_summary is not None: turn.compact_summary = compact_summary n_compactions += 1 - if n_compactions > MAX_COMPACTIONS: finish = "max_compactions" break - - # Reset conversation with summary + hint_line = f"\nHint: {active_compaction_hint}" if active_compaction_hint else "" restart_user_msg = POST_COMPACT_USER.format( - problem_text=problem_text, + problem_text=problem_text + hint_line, summary=compact_summary, ) messages = [ {"role": "system", "content": sys_prompt}, {"role": "user", "content": restart_user_msg}, ] - # Reset peak tracking for new window peak_tokens = 0 + conversation.append(Turn(role="user", content=f"[COMPACTION #{n_compactions} — context reset]")) + continue + + # Harness-forced compaction: if Compact config and we've crossed 50% of token budget + # and the model didn't voluntarily compact, force a summary + context reset. + if compaction and total_now >= 0.5 * token_limit and compact_summary is None: + force_prompt = ( + "You have used over 50% of your context budget. " + "Summarize your progress, approach, and any intermediate results so far. 
" + "Be concise but preserve all critical information needed to continue solving this problem." + ) + try: + force_resp = client.generate( + messages + [{"role": "user", "content": force_prompt}], + max_tokens=500, + ) + summary = force_resp["content"] + except Exception as e: + summary = f"[forced compaction failed: {e}]" + + n_compactions += 1 + conversation.append(Turn( + role="assistant", + content=summary, + forced_compact=True, + )) conversation.append(Turn( role="user", - content=f"[COMPACTION #{n_compactions} — context reset]", + content=f"[FORCED COMPACTION #{n_compactions} at {int(100 * total_now / token_limit)}% — context reset]", )) + messages = [ + {"role": "system", "content": sys_prompt}, + {"role": "user", "content": POST_COMPACT_USER.format( + problem_text=problem_text, + summary=summary, + )}, + ] + peak_tokens = 0 continue - # ── Check budget exceeded (compaction mode = hard fail) ── if total_now >= token_limit: - if compaction: - finish = "budget_exceeded" - else: - finish = "truncated" + finish = "budget_exceeded" if compaction else "truncated" break - # ── Check for python code blocks (TIR mode) ── code_blocks = extract_python_blocks(content) if tir else [] if code_blocks: - # Execute ALL code blocks in order (variables persist) all_outputs = [] for code in code_blocks: n_code_calls += 1 @@ -410,11 +1231,8 @@ def run_trial( n_code_errors += 1 all_outputs.append(output) combined_output = "\n---\n".join(all_outputs) - - # Truncate long output if len(combined_output) > 2000: combined_output = combined_output[:2000] + "\n... 
(truncated)" - code_turn = Turn( role="user", content=f"Code output:\n{combined_output}", @@ -426,22 +1244,36 @@ def run_trial( messages.append({"role": "user", "content": f"Code output:\n{combined_output}"}) continue - # ── No code, no answer — prompt to continue ── messages.append({"role": "assistant", "content": content}) messages.append({"role": "user", "content": "Continue solving."}) conversation.append(Turn(role="user", content="Continue solving.")) - # ── Extract answer ── - # Try to find answer from the full conversation + # Extract final answer from conversation answer = None - for t in reversed(conversation): - if t.role == "assistant": - answer = extract_boxed_answer(t.content) - if answer is not None: + if is_arc: + # For ARC, evaluate against ground truth grids + for t in reversed(conversation): + if t.role == "assistant": + arc_result = evaluate_arc_answer(t.content, correct_answer) + if arc_result["num_answers_found"] > 0: + answer = "arc_answer_found" + break + elapsed = time.time() - t0 + # Re-evaluate the last assistant response for correctness + success = False + for t in reversed(conversation): + if t.role == "assistant": + arc_result = evaluate_arc_answer(t.content, correct_answer) + success = arc_result["correct"] break - - elapsed = time.time() - t0 - success = answer is not None and answer == correct_answer + else: + for t in reversed(conversation): + if t.role == "assistant": + answer = extract_boxed_answer(t.content) + if answer is not None: + break + elapsed = time.time() - t0 + success = answer is not None and answer == correct_answer return TrialResult( problem_id=problem_id, @@ -468,9 +1300,8 @@ def run_trial( @dataclass class WindowTest: - """Result of testing one window size.""" window: int - trials: list # list of TrialResult dicts + trials: list n_success: int n_trials: int pass_rate: float @@ -478,20 +1309,18 @@ class WindowTest: def binary_search( - client: LLMClient, + client, problem_id: str, problem_text: str, - 
correct_answer: int, + correct_answer, tir: bool, compaction: bool, min_window: int = MIN_WINDOW, max_window: int = MAX_WINDOW, trials: int = TRIALS_PER_WINDOW, + compaction_hint: str = "", + topic: str = "math", ) -> dict: - """ - Binary search (log scale) for minimum context window. - Returns full results dict with all trials. - """ config_name = f"{'Compact' if compaction else 'HardCut'}" print(f"\n{'='*60}") print(f" {problem_id} | {config_name}") @@ -500,11 +1329,11 @@ def binary_search( search_log: list[WindowTest] = [] - # First: verify solvable at max window + # Verify solvable at max window print(f"\n [Verify] Testing max window = {max_window} ...") test = _test_window( client, problem_id, problem_text, correct_answer, - max_window, tir, compaction, trials + max_window, tir, compaction, trials, compaction_hint, topic ) search_log.append(test) print(f" [Verify] {test.n_success}/{test.n_trials} passed ({test.pass_rate:.0%})") @@ -517,23 +1346,19 @@ def binary_search( search_range_final=(min_window, max_window), ) - # Binary search lo, hi = min_window, max_window step = 0 - while hi / lo > CONVERGENCE_RATIO: + while hi / lo > CONVERGENCE_RATIO and (hi - lo) > CONVERGENCE_ABS: step += 1 - mid = int(math.exp((math.log(lo) + math.log(hi)) / 2)) - # Snap to multiples of 64 for cleanliness - mid = max(min_window, (mid // 64) * 64) - - # Avoid re-testing same values + mid = (lo + hi) // 2 + mid = max(min_window, max(1, (mid // 16) * 16)) if mid == lo or mid == hi: break - print(f"\n [Step {step}] Testing window = {mid} (range [{lo}, {hi}], ratio {hi/lo:.3f})") + print(f"\n [Step {step}] Testing window = {mid} (range [{lo}, {hi}], gap {hi-lo}, ratio {hi/lo:.3f})") test = _test_window( client, problem_id, problem_text, correct_answer, - mid, tir, compaction, trials + mid, tir, compaction, trials, compaction_hint, topic ) search_log.append(test) print(f" [Step {step}] {test.n_success}/{test.n_trials} passed ({test.pass_rate:.0%}) → {'hi=mid' if test.passed else 
'lo=mid'}") @@ -543,11 +1368,12 @@ def binary_search( else: lo = mid - print(f"\n RESULT: minimum window ≈ {hi} tokens (range [{lo}, {hi}])") - + # Snap to nearest multiple of 16 (round up) + snapped = ((hi + 15) // 16) * 16 + print(f"\n RESULT: minimum window ≈ {hi} tokens → snapped to {snapped} (range [{lo}, {hi}])") return _build_result( problem_id, tir, compaction, search_log, - minimum_window=hi, + minimum_window=snapped, search_range_final=(lo, hi), ) @@ -555,20 +1381,19 @@ def binary_search( def _test_window( client, problem_id, problem_text, correct_answer, window, tir, compaction, n_trials, + compaction_hint: str = "", + topic: str = "math", ) -> WindowTest: - """Run N trials at a given window size, in parallel.""" t0 = time.time() def _run_one(i): return run_trial( client, problem_id, problem_text, correct_answer, - token_limit=window, - tir=tir, - compaction=compaction, - trial_idx=i, + token_limit=window, tir=tir, compaction=compaction, + trial_idx=i, compaction_hint=compaction_hint, + topic=topic, ) - # Run all trials in parallel (server has enough slots) trials_results = [None] * n_trials n_success = 0 with ThreadPoolExecutor(max_workers=n_trials) as pool: @@ -587,12 +1412,9 @@ def _run_one(i): pass_rate = n_success / n_trials print(f" [{n_trials} trials in {elapsed:.1f}s wall, {n_success}/{n_trials} passed]") return WindowTest( - window=window, - trials=trials_results, - n_success=n_success, - n_trials=n_trials, - pass_rate=pass_rate, - passed=pass_rate >= SUCCESS_THRESHOLD, + window=window, trials=trials_results, + n_success=n_success, n_trials=n_trials, + pass_rate=pass_rate, passed=pass_rate >= SUCCESS_THRESHOLD, ) @@ -611,15 +1433,101 @@ def _build_result(problem_id, tir, compaction, search_log, minimum_window, searc } -# ─── Main ──────────────────────────────────────────────────────────────────── +# ─── Unbounded Mode ─────────────────────────────────────────────────────────── + +def run_unbounded( + client, + model_name: str, + problem_id: 
str, + problem_text: str, + correct_answer, + n_runs: int = 5, + topic: str = "math", + tir: bool = False, +) -> dict: + """ + Run problem n_runs times with no artificial context window constraints. + Uses the model's full context window. No compaction, no token limit hints + in the system prompt — just a clean "solve this problem" prompt. + + Returns a result dict with schema: + {model_name, problem_id, config: "Unbounded", context_window, n_runs, + runs: [{tokens_used, solved, answer, wall_time_s}, ...], + avg_tokens, min_tokens, max_tokens, solve_rate, timestamp} + """ + context_window = get_model_context_window(model_name) + is_arc = (topic == "arc") + + # Clean system prompt — no mention of token limits or context windows + sys_prompt_override = None if is_arc else SYSTEM_UNBOUNDED + + print(f"\n{'='*60}") + print(f" {problem_id} | Unbounded | model={model_name}") + print(f" Context window: {context_window:,} | n_runs: {n_runs}") + print(f"{'='*60}") + + runs = [] + for i in range(n_runs): + print(f"\n [Unbounded] Run {i+1}/{n_runs} ...") + result = run_trial( + client=client, + problem_id=problem_id, + problem_text=problem_text, + correct_answer=correct_answer, + token_limit=context_window, + tir=tir, + compaction=False, + trial_idx=i, + topic=topic, + system_prompt_override=sys_prompt_override, + ) + run_entry = { + "tokens_used": result.total_tokens_peak, + "solved": result.success, + "answer": str(result.answer) if result.answer is not None else None, + "wall_time_s": result.wall_time_s, + } + runs.append(run_entry) + status = "OK" if result.success else "FAIL" + print(f" [Unbounded] Run {i+1}: {status} | {result.total_tokens_peak} tok | {result.wall_time_s}s") + + all_tokens = [r["tokens_used"] for r in runs] + n_solved = sum(1 for r in runs if r["solved"]) + avg_tokens = int(round(sum(all_tokens) / len(all_tokens))) if all_tokens else 0 + min_tokens = min(all_tokens) if all_tokens else 0 + max_tokens = max(all_tokens) if all_tokens else 0 + solve_rate = 
n_solved / n_runs if n_runs > 0 else 0.0 + + result_data = { + "model_name": model_name, + "problem_id": problem_id, + "config": "Unbounded", + "context_window": context_window, + "n_runs": n_runs, + "runs": runs, + "avg_tokens": avg_tokens, + "min_tokens": min_tokens, + "max_tokens": max_tokens, + "solve_rate": solve_rate, + "timestamp": datetime.now(timezone.utc).isoformat(), + } + + RESULTS_DIR.mkdir(exist_ok=True) + outpath = result_filename(model_name, problem_id, "Unbounded") + outpath.write_text(json.dumps(result_data, indent=2, default=str)) + print(f"\n Saved (Unbounded): {outpath.name}") + print(f" solve_rate={solve_rate:.2f} avg={avg_tokens} min={min_tokens} max={max_tokens}") + + return result_data + + +# ─── Problem Loading ───────────────────────────────────────────────────────── def load_problem(problem_id: str) -> dict: - """Load a problem JSON from the problems/ directory.""" - # Try exact match + """Load a problem JSON from problems/. Matches exact stem or substring.""" path = PROBLEMS_DIR / f"{problem_id}.json" if path.exists(): return json.loads(path.read_text()) - # Try fuzzy match (e.g., "ab507a9f" matches "aimo3_hard_ab507a9f.json") for p in PROBLEMS_DIR.glob("*.json"): if problem_id in p.stem: return json.loads(p.read_text()) @@ -630,19 +1538,42 @@ def load_all_problems() -> list[dict]: return [json.loads(p.read_text()) for p in sorted(PROBLEMS_DIR.glob("*.json"))] +# ─── Result Filename Helpers ───────────────────────────────────────────────── + +def result_filename(model_name: str, problem_id: str, config_name: str) -> Path: + """ + Build result file path for a given model/problem/config combination. + Format: results/{model_name}_{problem_id}_{config_name}.json + Model name is sanitized (spaces → underscores, slashes → dashes). 
+ """ + safe_model = re.sub(r"[^\w\-]", "_", model_name) + return RESULTS_DIR / f"{safe_model}_{problem_id}_{config_name}.json" + + +def summary_filename(model_name: str, problem_id: str) -> Path: + safe_model = re.sub(r"[^\w\-]", "_", model_name) + return RESULTS_DIR / f"{safe_model}_{problem_id}_summary.json" + + +# ─── Single-Problem Runner ─────────────────────────────────────────────────── + def run_problem( - client: LLMClient, + client, problem: dict, + model_name: str = "unknown", configs: list[tuple[bool, bool]] = None, min_window: int = MIN_WINDOW, max_window: int = MAX_WINDOW, trials: int = TRIALS_PER_WINDOW, ): - """Run binary search for all configs on one problem. Save results.""" + """ + Run binary search for all configs on one problem. Save per-config and summary results. + Results namespaced by model_name to prevent multi-model collisions. + """ if configs is None: configs = [ - (False, False), # Hard Cutoff (no tools) - (False, True), # Compaction (compact tool only) + (False, False), # NoTIR + HardCut + (False, True), # NoTIR + Compact ] pid = problem["problem_id"] @@ -650,7 +1581,40 @@ def run_problem( all_results = [] for tir, compaction in configs: - config_name = f"{'Compact' if compaction else 'HardCut'}" + config_name = f"{'TIR' if tir else 'NoTIR'}_{'Compact' if compaction else 'HardCut'}" + outpath = result_filename(model_name, pid, config_name) + + # Resume: skip if valid completed result exists + if outpath.exists(): + try: + existing = json.loads(outpath.read_text()) + if existing.get("minimum_window") is not None or existing.get("binary_search"): + print(f"\n [SKIP] {model_name} | {pid} | {config_name} — result exists at {outpath.name}") + all_results.append(existing) + continue + except Exception: + pass + + # Prediction phase + prediction = run_prediction_phase(client, problem, max_tokens=300) + compaction_hint = prediction.get("compaction_prompt", DEFAULT_COMPACTION_PROMPT) + + if not prediction.get("success_prediction", True): + 
print(f"\n [Prediction Phase] Model opted out. Skipping binary search for {pid} | {config_name}.") + result = _build_result( + pid, tir, compaction, [], + minimum_window=None, + search_range_final=(min_window, max_window), + ) + result["prediction"] = prediction + result["model_name"] = model_name + all_results.append(result) + outpath.write_text(json.dumps(result, indent=2, default=str)) + print(f"\n Saved (opt-out): {outpath.name}") + continue + + # Binary search + problem_topic = problem.get("topic", "math") result = binary_search( client, problem_id=pid, @@ -661,104 +1625,335 @@ def run_problem( min_window=min_window, max_window=max_window, trials=trials, + compaction_hint=compaction_hint, + topic=problem_topic, ) - result["model"] = "Qwen3.5-35B-A3B-Q4_K_M" + result["model_name"] = model_name + result["prediction"] = prediction all_results.append(result) - # Save per-config result (with full traces) - outpath = RESULTS_DIR / f"{pid}_{config_name}.json" outpath.write_text(json.dumps(result, indent=2, default=str)) - print(f"\n Saved: {outpath}") + print(f"\n Saved: {outpath.name}") - # Save combined summary (without conversation traces for readability) + # Save combined summary (compact, no conversation traces) summary = [] for r in all_results: - summary.append({ + entry = { + "model_name": model_name, "problem_id": r["problem_id"], - "config": r["config"]["name"], + "config": r["config"]["name"] if isinstance(r.get("config"), dict) else r.get("config"), "minimum_window": r["minimum_window"], - "search_range_final": r["search_range_final"], - "steps": len(r["binary_search"]), - }) + "search_range_final": r.get("search_range_final"), + "steps": len(r.get("binary_search", [])), + } + pred = r.get("prediction") + if pred: + entry["n_reliable_prediction"] = pred.get("n_reliable_prediction") + entry["success_prediction"] = pred.get("success_prediction") + summary.append(entry) - summary_path = RESULTS_DIR / f"{pid}_summary.json" - 
summary_path.write_text(json.dumps(summary, indent=2)) - print(f"\n Summary: {summary_path}") + sp = summary_filename(model_name, pid) + sp.write_text(json.dumps(summary, indent=2)) + print(f"\n Summary: {sp.name}") return all_results +# ─── Multi-Model Runner ────────────────────────────────────────────────────── + +def load_models_json() -> list[dict]: + """Load models.json from the AmnesiaBench directory. Returns list of {name, url} dicts.""" + if not MODELS_JSON.exists(): + raise FileNotFoundError( + f"models.json not found at {MODELS_JSON}. " + "Create it with a list of {{name, url}} entries." + ) + models = json.loads(MODELS_JSON.read_text()) + if not isinstance(models, list) or not models: + raise ValueError("models.json must be a non-empty list of {name, url} objects.") + for m in models: + if "name" not in m or "url" not in m: + raise ValueError(f"Each model entry must have 'name' and 'url' keys. Got: {m}") + return models + + +def run_all_models( + problems: list[dict], + configs: list[tuple[bool, bool]] = None, + min_window: int = MIN_WINDOW, + max_window: int = MAX_WINDOW, + trials: int = TRIALS_PER_WINDOW, + temperature: float = TEMPERATURE, + cli_api_key: str = None, +): + """ + Iterate over all models in models.json, run all problems for each model. + Models are run sequentially (one model at a time, all problems per model). + If a model's server is unreachable, it is skipped with a warning. + Supports api_key_env field in models.json for Gemini-style API key lookup. 
+ """ + models = load_models_json() + print(f"\n{'#'*70}") + print(f" --run-all-models: {len(models)} model(s) × {len(problems)} problem(s)") + for m in models: + print(f" {m['name']} → {m['url']}") + print(f"{'#'*70}\n") + + for model_entry in models: + mname = model_entry["name"] + murl = model_entry["url"] + print(f"\n{'#'*70}") + print(f" MODEL: {mname}") + print(f" URL: {murl}") + print(f"{'#'*70}") + + # Resolve API key: cli flag > api_key_env field > env var GEMINI_API_KEY + api_key = cli_api_key + api_key_env = model_entry.get("api_key_env") + if not api_key and api_key_env: + api_key = os.environ.get(api_key_env) + if api_key: + print(f" API key resolved from env var: {api_key_env}") + else: + print(f" WARNING: api_key_env='{api_key_env}' not found in environment") + + try: + client = create_client( + server_url=murl, + api_key=api_key, + model_name=mname, + temperature=temperature, + ) + except ValueError as e: + print(f" ERROR: Could not create client for {mname}: {e} — skipping") + continue + + if not client.ping(): + print(f" WARNING: Cannot reach server at {murl} — skipping {mname}") + continue + + print(f" Server OK: {murl}") + for problem in problems: + print(f"\n{'='*60}") + print(f" PROBLEM: {problem['problem_id']}") + print(f" Answer: {problem['ground_truth']}") + print(f"{'='*60}") + run_problem( + client, problem, + model_name=mname, + configs=configs, + min_window=min_window, + max_window=max_window, + trials=trials, + ) + + print("\n\nAll models done. Run --scores for composite scoring table.") + + +# ─── Analysis ──────────────────────────────────────────────────────────────── + def analyze_results(): - """Print a summary table of all completed results.""" - results_files = sorted(RESULTS_DIR.glob("*_summary.json")) - if not results_files: + """Print a per-model summary table of all completed results.""" + summary_files = sorted(RESULTS_DIR.glob("*_summary.json")) + if not summary_files: print("No results found. 
Run experiments first.") return - print(f"\n{'Problem':<30} {'Config':<20} {'Min Window':>10} {'Range':>16}") - print("-" * 80) - for f in results_files: - data = json.loads(f.read_text()) + print(f"\n{'Model':<25} {'Problem':<30} {'Config':<24} {'Min Window':>10} {'Range':>18} {'Steps':>6}") + print("-" * 118) + + current_model = None + for f in summary_files: + try: + data = json.loads(f.read_text()) + except Exception as e: + print(f" [analyze] Could not read {f.name}: {e}") + continue + for entry in data: - lo, hi = entry["search_range_final"] - mw = entry["minimum_window"] + model = entry.get("model_name", "unknown") + pid = entry.get("problem_id", "?") + config = entry.get("config", "?") + mw = entry.get("minimum_window") mw_str = str(mw) if mw is not None else "UNSOLVABLE" - print(f"{entry['problem_id']:<30} {entry['config']:<20} {mw_str:>10} [{lo:>6}, {hi:>6}]") + sr = entry.get("search_range_final", ["-", "-"]) + lo, hi = sr if sr else ("-", "-") + steps = entry.get("steps", "?") + + if model != current_model: + if current_model is not None: + print() + current_model = model + + print(f"{model:<25} {pid:<30} {config:<24} {mw_str:>10} [{str(lo):>6}, {str(hi):>6}] {str(steps):>6}") + + +# ─── Main ──────────────────────────────────────────────────────────────────── + +def derive_model_name(url: str) -> str: + """Derive a short model name from the server URL.""" + url = url.rstrip("/") + # For gemini:// URLs extract the model name directly + if url.startswith("gemini://") or url.startswith("google://"): + scheme = "gemini://" if url.startswith("gemini://") else "google://" + return url[len(scheme):].strip("/") or "gemini" + # For anthropic:// URLs extract the model name directly + if url.startswith("anthropic://"): + return url[len("anthropic://"):].strip("/") or "claude-sonnet-4-6" + # Extract host:port, replace dots/colons with underscores + host_port = url.split("//")[-1] + return re.sub(r"[^\w]", "_", host_port) def main(): - parser = 
argparse.ArgumentParser(description="AmnesiaBench — context window binary search") + parser = argparse.ArgumentParser(description="AmnesiaBench v2 — multi-model context window benchmark") group = parser.add_mutually_exclusive_group(required=True) group.add_argument("--problem", type=str, help="Problem ID (or substring) to test") group.add_argument("--all", action="store_true", help="Run all problems") group.add_argument("--analyze", action="store_true", help="Analyze existing results") + group.add_argument("--scores", action="store_true", help="Print composite Scott scoring table") + + parser.add_argument("--model", type=str, default=SERVER_URL, + help=f"Server URL (default: {SERVER_URL}). Use gemini://MODEL for Gemini.") + parser.add_argument("--model-name", type=str, default=None, + help="Label for this model in results (default: derived from --model URL)") + parser.add_argument("--api-key", type=str, default=None, + help="API key for Gemini backends (overrides GEMINI_API_KEY env var)") + parser.add_argument("--run-all-models", action="store_true", + help="Iterate over all models in models.json (overrides --model/--model-name)") - parser.add_argument("--server", type=str, default=SERVER_URL, help="llama.cpp server URL") parser.add_argument("--min-window", type=int, default=MIN_WINDOW) parser.add_argument("--max-window", type=int, default=MAX_WINDOW) parser.add_argument("--trials", type=int, default=TRIALS_PER_WINDOW) parser.add_argument("--temperature", type=float, default=TEMPERATURE) parser.add_argument("--config", type=str, default=None, help="Run specific config only: NoTIR_HardCut, TIR_HardCut, NoTIR_Compact, TIR_Compact") + parser.add_argument("--results-dir", type=str, default=None, + help="Results directory for --scores / --analyze (default: ./results)") args = parser.parse_args() + # Redirect results dir if specified + if args.results_dir: + global RESULTS_DIR + RESULTS_DIR = Path(args.results_dir) + if args.analyze: analyze_results() return + if 
args.scores: + rd = Path(args.results_dir) if args.results_dir else None + calculate_scores(rd) + return + min_window = args.min_window max_window = args.max_window trials_per_window = args.trials - client = LLMClient(server_url=args.server, temperature=args.temperature) - if not client.ping(): - print(f"ERROR: Cannot reach llama.cpp server at {args.server}") - print(f"Start it first:\n llama-server --model --host 0.0.0.0 --port 8080 --ctx-size 65536") - sys.exit(1) - print(f"Server OK: {args.server}") - - # Parse config filter + # Config filter configs = None if args.config: config_map = { + "NoTIR_HardCut": (False, False), + "TIR_HardCut": (True, False), + "NoTIR_Compact": (False, True), + "TIR_Compact": (True, True), + # Legacy short names "HardCut": (False, False), "Compact": (False, True), + # Unbounded mode — no binary search, full context window, no token hints + "Unbounded": None, } if args.config not in config_map: print(f"ERROR: Unknown config '{args.config}'. Choose from: {list(config_map.keys())}") sys.exit(1) - configs = [config_map[args.config]] + if args.config == "Unbounded": + configs = "unbounded" + else: + configs = [config_map[args.config]] + # Load problems if args.all: problems = load_all_problems() else: problems = [load_problem(args.problem)] + # Resolve API key: --api-key > scheme-specific env var > GEMINI_API_KEY fallback + _model_url = args.model + if args.api_key: + api_key = args.api_key + elif _model_url.startswith("openrouter://"): + api_key = os.environ.get("OPENROUTER_API_KEY") + elif _model_url.startswith("anthropic://"): + api_key = os.environ.get("ANTHROPIC_OAUTHTOKEN") + else: + api_key = os.environ.get("GEMINI_API_KEY") + + # Multi-model mode + if args.run_all_models: + run_all_models( + problems=problems, + configs=configs, + min_window=min_window, + max_window=max_window, + trials=trials_per_window, + temperature=args.temperature, + cli_api_key=api_key, + ) + return + + # Single-model mode (must create client before Unbounded 
dispatch below) + model_url = args.model + model_name = args.model_name or derive_model_name(model_url) + + try: + client = create_client( + server_url=model_url, + api_key=api_key, + model_name=model_name, + temperature=args.temperature, + ) + except ValueError as e: + print(f"ERROR: {e}") + sys.exit(1) + + if not client.ping(): + print(f"ERROR: Cannot reach server at {model_url}") + if model_url.startswith("http"): + print(f"Start it first:\n llama-server --model --host 0.0.0.0 --port 8080 --ctx-size 65536") + else: + print(f"Check your API key and model name.") + sys.exit(1) + print(f"Server OK: {model_url} (model_name: {model_name})") + + # Unbounded mode: bypass binary search entirely + if configs == "unbounded": + print(f"Problems: {[p['problem_id'] for p in problems]}") + print(f"Trials (n_runs): {trials_per_window}") + print(f"Config: Unbounded (full context window, no token hints)") + print() + for problem in problems: + print(f"\n{'#'*60}") + print(f" PROBLEM: {problem['problem_id']}") + print(f" Answer: {problem['ground_truth']}") + print(f"{'#'*60}") + run_unbounded( + client=client, + model_name=model_name, + problem_id=problem["problem_id"], + problem_text=problem["problem_text"], + correct_answer=problem["ground_truth"], + n_runs=trials_per_window, + topic=problem.get("topic", "math"), + ) + print("\n\nAll done (Unbounded). 
Run --analyze to see summary.") + return + print(f"Problems: {[p['problem_id'] for p in problems]}") print(f"Search range: [{min_window}, {max_window}]") print(f"Trials per window: {trials_per_window}") - print(f"Configs: {[c for c in (configs or [(False,False),(False,True)])]}") + print(f"Configs: {configs or [(False,False),(False,True)]}") print() for problem in problems: @@ -767,11 +1962,16 @@ def main(): print(f" Answer: {problem['ground_truth']}") print(f" 120B pass rate: {problem.get('gptoss_120b_pass_rate', '?')}") print(f"{'#'*60}") - run_problem(client, problem, configs=configs, - min_window=min_window, max_window=max_window, - trials=trials_per_window) + run_problem( + client, problem, + model_name=model_name, + configs=configs, + min_window=min_window, + max_window=max_window, + trials=trials_per_window, + ) - print("\n\nAll done. Run --analyze to see summary.") + print("\n\nAll done. Run --analyze to see summary or --scores for composite score table.") if __name__ == "__main__": diff --git a/arc/__init__.py b/arc/__init__.py new file mode 100644 index 0000000..234b5ab --- /dev/null +++ b/arc/__init__.py @@ -0,0 +1 @@ +# ARC support module for AmnesiaBench diff --git a/arc/arc_evaluator.py b/arc/arc_evaluator.py new file mode 100644 index 0000000..bd516f9 --- /dev/null +++ b/arc/arc_evaluator.py @@ -0,0 +1,181 @@ +# Author: Claude Sonnet 4.6 +# Date: 30-March-2026 +# PURPOSE: ARC Answer Evaluator for AmnesiaBench. Parses model responses containing +# grid answers inside numbered tags — one attempt per test pair. +# Single test: . Two tests: + . Etc. +# Task is solved if ALL test pairs match exactly. No external dependencies. +# SRP/DRY check: Pass — extraction and evaluation are cleanly separated functions, +# grid parsing logic is not duplicated. 
+ +from __future__ import annotations + +import json +import re +import sys +from typing import Optional + + +def _parse_grid(raw: str) -> Optional[list[list[int]]]: + """Parse space-separated rows into a 2D list of ints.""" + raw = raw.strip() + if not raw: + return None + grid = [] + for line in raw.split("\n"): + line = line.strip() + if not line: + continue + try: + row = [int(x) for x in line.split()] + if row: + grid.append(row) + except ValueError: + return None + return grid if grid else None + + +def extract_grid_answer(response_text: str, index: int = 1) -> Optional[list[list[int]]]: + """Extract grid from tag where N = index.""" + match = re.search(rf"\s*(.*?)\s*", response_text, re.DOTALL | re.IGNORECASE) + if not match: + return None + return _parse_grid(match.group(1)) + + +def extract_all_numbered_answers(response_text: str) -> dict[int, Optional[list[list[int]]]]: + """ + Extract all ... blocks from response. + Returns dict mapping N -> parsed grid (or None if unparseable). 
+ """ + matches = re.finditer(r"\s*(.*?)\s*", response_text, re.DOTALL | re.IGNORECASE) + results = {} + for m in matches: + idx = int(m.group(1)) + results[idx] = _parse_grid(m.group(2)) + return results + + +def evaluate_single_grid(predicted: Optional[list[list[int]]], ground_truth: list[list[int]]) -> dict: + """Evaluate one predicted grid against one ground truth grid.""" + if predicted is None: + return {"correct": False, "predicted_grid": None, "expected_grid": ground_truth, "dimensions_match": False} + + pred_rows, gt_rows = len(predicted), len(ground_truth) + pred_cols = len(predicted[0]) if predicted else 0 + gt_cols = len(ground_truth[0]) if ground_truth else 0 + + return { + "correct": predicted == ground_truth, + "predicted_grid": predicted, + "expected_grid": ground_truth, + "dimensions_match": (pred_rows == gt_rows) and (pred_cols == gt_cols), + } + + +def evaluate_arc_answer(response_text: str, ground_truth: list) -> dict: + """ + Evaluate model's ARC answer against ground truth. + + ground_truth: list of 2D grids (one per test pair). + Model provides for test 1, for test 2, etc. + One attempt per test pair. Task solved if all pairs match exactly. + """ + if not ground_truth: + return {"correct": False, "num_test_pairs": 0, "per_pair": []} + + # Detect legacy single-grid format + is_multi = isinstance(ground_truth[0], list) and ground_truth[0] and isinstance(ground_truth[0][0], list) + if not is_multi: + ground_truth = [ground_truth] + + answers = extract_all_numbered_answers(response_text) + + per_pair = [] + for i, gt in enumerate(ground_truth): + # answer_1 = test pair 0, answer_2 = test pair 1, etc. 
+ pred = answers.get(i + 1) + result = evaluate_single_grid(pred, gt) + result["test_pair_index"] = i + result["answer_tag"] = f"answer_{i + 1}" + per_pair.append(result) + + return { + "correct": all(p["correct"] for p in per_pair), + "num_test_pairs": len(ground_truth), + "num_answers_found": len(answers), + "per_pair": per_pair, + } + + +# ── Tests ───────────────────────────────────────────────────────────────────── + +if __name__ == "__main__": + print("ARC Evaluator — Self-Test") + print("=" * 50) + + # 1: Single test correct + gt1 = [[[0, 0, 2], [0, 1, 0], [2, 2, 2]]] + r1 = evaluate_arc_answer("\n0 0 2\n0 1 0\n2 2 2\n", gt1) + assert r1["correct"]; print(" [PASS] 1: Single test correct") + + # 2: Single test wrong + r2 = evaluate_arc_answer("\n0 0 0\n0 0 0\n0 0 0\n", gt1) + assert not r2["correct"]; print(" [PASS] 2: Single test wrong") + + # 3: No tags + r3 = evaluate_arc_answer("no answer", gt1) + assert not r3["correct"]; print(" [PASS] 3: No tags") + + # 4: Two tests both correct + gt4 = [[[1, 2], [3, 4]], [[5, 6], [7, 8]]] + r4 = evaluate_arc_answer("\n1 2\n3 4\n\n\n5 6\n7 8\n", gt4) + assert r4["correct"]; print(" [PASS] 4: Two tests both correct") + + # 5: Two tests, second wrong + r5 = evaluate_arc_answer("\n1 2\n3 4\n\n\n0 0\n0 0\n", gt4) + assert not r5["correct"] + assert r5["per_pair"][0]["correct"] and not r5["per_pair"][1]["correct"] + print(" [PASS] 5: Two tests, second wrong") + + # 6: Missing answer_2 + r6 = evaluate_arc_answer("\n1 2\n3 4\n", gt4) + assert not r6["correct"]; print(" [PASS] 6: Missing answer_2 = fail") + + # 7: Three tests all correct + gt7 = [[[1, 1]], [[2, 2]], [[3, 3]]] + r7 = evaluate_arc_answer("\n1 1\n\n\n2 2\n\n\n3 3\n", gt7) + assert r7["correct"]; print(" [PASS] 7: Three tests correct") + + # 8: Case insensitive + r8 = evaluate_arc_answer("\n0 0 2\n0 1 0\n2 2 2\n", gt1) + assert r8["correct"]; print(" [PASS] 8: Case insensitive") + + # 9: Legacy single grid + r9 = evaluate_arc_answer("\n1 2\n3 4\n", [[1, 2], [3, 
4]]) + assert r9["correct"]; print(" [PASS] 9: Legacy format") + + # 10: Empty tags + r10 = evaluate_arc_answer("\n\n", gt1) + assert not r10["correct"]; print(" [PASS] 10: Empty tags") + + # 11: Tags out of order still work + r11 = evaluate_arc_answer("\n5 6\n7 8\n\n\n1 2\n3 4\n", gt4) + assert r11["correct"]; print(" [PASS] 11: Tags out of order") + + print("\nAll 11 tests passed!") + + try: + with open("arc_problems.json") as f: + problems = json.load(f) + print(f"\nValidating {len(problems)} problems...") + for p in problems: + gt = p["ground_truth"] + blocks = [] + for i, grid in enumerate(gt, 1): + grid_text = "\n".join(" ".join(str(c) for c in row) for row in grid) + blocks.append(f"\n{grid_text}\n") + result = evaluate_arc_answer("\n".join(blocks), gt) + assert result["correct"], f"Failed: {p['problem_id']}" + print(f" All {len(problems)} problems validate ✅") + except FileNotFoundError: + print("\n (arc_problems.json not found)") diff --git a/arc/arc_problems.json b/arc/arc_problems.json new file mode 100644 index 0000000..2e9a32e --- /dev/null +++ b/arc/arc_problems.json @@ -0,0 +1,24124 @@ +[ + { + "problem_id": "arc1_50f325b5", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n2 2 0 7 0 3 2 7 0 2 7 0 3 2 7 0 0 3\n2 2 0 0 2 3 3 4 0 0 7 0 0 0 0 0 0 7\n4 2 7 2 7 0 4 0 0 7 2 0 3 0 7 3 2 0\n3 7 2 2 7 0 0 3 0 2 4 0 2 4 0 4 3 3\n2 4 3 2 0 4 3 2 3 2 0 0 8 8 8 7 0 2\n2 7 3 2 7 0 0 2 3 3 3 7 0 8 2 2 2 0\n0 2 2 2 0 3 2 7 3 3 7 0 0 8 0 0 0 0\n4 2 7 3 0 3 0 7 2 7 2 0 4 2 7 7 0 0\n0 0 2 0 2 0 4 7 4 0 0 2 2 2 3 3 3 0\n2 0 4 7 0 7 0 3 2 4 2 0 0 2 0 0 2 7\n7 4 2 7 4 3 3 7 2 2 0 0 7 7 0 7 0 4\n\nOutput:\n2 2 0 7 0 3 2 7 0 2 7 0 3 2 7 0 0 3\n2 2 0 0 2 3 3 4 0 0 7 0 0 0 0 0 0 7\n4 2 7 2 7 0 4 0 0 7 2 0 3 0 7 3 2 0\n3 7 2 2 7 0 0 3 0 2 4 0 2 4 0 4 3 3\n2 4 3 2 0 4 3 2 8 2 0 0 8 8 8 7 0 2\n2 7 3 2 7 0 0 2 8 8 8 7 0 8 2 2 2 0\n0 2 2 2 0 3 2 7 8 3 7 0 0 8 0 0 0 0\n4 2 7 3 0 3 0 7 2 7 2 0 4 2 7 7 0 0\n0 0 2 0 2 0 4 7 4 0 0 2 2 2 3 3 3 
0\n2 0 4 7 0 7 0 3 2 4 2 0 0 2 0 0 2 7\n7 4 2 7 4 3 3 7 2 2 0 0 7 7 0 7 0 4\n\nTraining Example 2:\nInput:\n2 7 7 0 0 3 3 2 2 0 0 2 3 3 7 0 0\n0 3 7 2 2 4 2 7 4 2 7 2 2 7 0 7 2\n2 3 0 3 7 3 0 2 7 2 0 2 2 3 2 3 2\n2 4 7 3 0 0 4 2 4 2 4 0 7 0 3 3 0\n7 3 2 4 3 2 0 0 7 2 0 3 2 2 3 0 2\n2 7 3 7 2 2 2 0 2 2 7 4 2 2 3 0 3\n0 3 0 0 2 3 0 2 2 0 7 7 3 2 0 0 0\n2 0 0 4 0 2 2 2 0 4 4 0 7 0 0 3 2\n3 2 7 0 7 8 0 8 0 4 2 2 2 2 0 0 0\n7 2 3 4 3 2 8 8 2 0 4 0 3 7 0 3 2\n7 7 2 2 0 7 7 4 2 3 2 7 2 2 7 2 3\n0 0 0 4 2 3 0 4 7 7 3 0 7 2 0 3 0\n0 0 7 2 3 0 2 3 0 3 4 2 3 3 3 2 3\n7 2 2 2 2 3 0 3 0 3 3 0 7 0 3 3 2\n\nOutput:\n2 7 7 0 0 3 3 2 2 0 0 2 3 3 7 0 0\n0 3 7 2 2 4 2 7 4 2 7 2 2 7 0 7 2\n2 3 0 3 7 3 0 2 7 2 0 2 2 8 2 8 2\n2 4 7 3 0 0 4 2 4 2 4 0 7 0 8 8 0\n7 3 2 4 3 2 0 0 7 2 0 3 2 2 3 0 2\n2 7 3 7 2 2 2 0 2 2 7 4 2 2 3 0 3\n0 3 0 0 2 3 0 2 2 0 7 7 3 2 0 0 0\n2 0 0 4 0 2 2 2 0 4 4 0 7 0 0 3 2\n3 2 7 0 7 8 0 8 0 4 2 2 2 2 0 0 0\n7 2 3 4 3 2 8 8 2 0 4 0 3 7 0 3 2\n7 7 2 2 0 7 7 4 2 3 2 7 2 2 7 2 3\n0 0 0 4 2 3 0 4 7 7 8 0 7 2 0 8 0\n0 0 7 2 3 0 2 3 0 8 4 2 3 3 8 2 3\n7 2 2 2 2 3 0 3 0 8 8 0 7 0 8 8 2\n\nTraining Example 3:\nInput:\n3 0 0 7 3 3 3 2 2 3 3 2 0 2 4 7 2 0\n0 2 4 0 2 0 7 0 0 2 0 3 2 2 2 2 2 7\n7 0 2 3 0 4 4 7 2 7 7 0 4 0 4 3 0 3\n7 3 0 2 4 3 7 2 0 2 0 3 3 2 2 7 4 0\n0 3 4 3 2 4 3 8 0 2 3 3 4 0 3 0 3 0\n0 2 2 0 7 3 8 8 8 4 3 0 7 3 4 2 2 2\n2 3 2 4 7 0 7 2 0 4 0 0 0 0 7 0 4 7\n3 4 7 7 0 3 2 0 0 7 3 0 2 7 4 2 0 3\n2 3 0 3 3 0 0 2 2 0 7 7 3 0 2 2 2 3\n0 3 3 4 0 3 0 0 2 7 3 0 0 0 2 3 7 3\n0 3 4 3 0 7 2 0 3 0 3 3 0 4 0 2 3 3\n3 2 0 4 0 2 7 3 7 0 3 3 2 0 0 2 2 7\n2 2 3 3 4 3 7 7 2 2 4 0 0 0 4 2 3 2\n0 2 0 2 0 0 4 0 0 3 7 0 0 0 4 3 4 2\n0 4 3 0 0 3 0 0 7 0 0 0 2 3 3 7 4 3\n\nOutput:\n3 0 0 7 3 3 3 2 2 3 3 2 0 2 4 7 2 0\n0 2 4 0 2 0 7 0 0 2 0 3 2 2 2 2 2 7\n7 0 2 3 0 4 4 7 2 7 7 0 4 0 4 3 0 3\n7 3 0 2 4 3 7 2 0 2 0 3 3 2 2 7 4 0\n0 3 4 3 2 4 3 8 0 2 3 3 4 0 3 0 3 0\n0 2 2 0 7 3 8 8 8 4 3 0 7 3 4 2 2 2\n2 3 2 4 7 0 7 2 0 4 0 0 0 0 7 0 4 7\n3 4 7 7 0 3 2 0 0 7 3 0 2 7 4 2 0 3\n2 8 0 3 
3 0 0 2 2 0 7 7 3 0 2 2 2 3\n0 8 8 4 0 3 0 0 2 7 8 0 0 0 2 3 7 3\n0 8 4 3 0 7 2 0 3 0 8 8 0 4 0 2 3 3\n3 2 0 4 0 2 7 3 7 0 8 3 2 0 0 2 2 7\n2 2 3 3 4 3 7 7 2 2 4 0 0 0 4 2 3 2\n0 2 0 2 0 0 4 0 0 3 7 0 0 0 4 3 4 2\n0 4 3 0 0 3 0 0 7 0 0 0 2 3 3 7 4 3\n\nTraining Example 4:\nInput:\n2 3 2 8 4 4 0 2 3 0 2 4 7 7 3 7 3\n3 4 8 8 8 0 0 2 0 2 0 2 7 7 7 3 7\n7 3 0 8 0 2 2 0 2 2 0 7 3 0 3 3 3\n2 0 2 0 2 0 3 2 0 7 0 7 0 0 2 3 0\n7 7 4 3 7 2 0 2 3 0 3 4 7 2 0 3 7\n2 4 0 7 0 0 3 4 4 0 3 4 4 3 3 4 0\n3 2 7 3 7 3 7 2 0 2 3 2 3 3 3 4 4\n3 7 4 0 2 0 2 0 3 7 2 3 3 3 3 0 2\n3 2 3 2 0 2 0 2 0 7 2 0 2 4 4 7 3\n4 3 4 2 0 7 0 0 7 0 0 0 0 3 0 0 3\n2 3 0 0 4 0 2 0 3 3 2 0 4 0 0 2 2\n3 3 4 3 2 7 2 4 3 0 7 3 3 4 2 0 3\n2 0 7 7 0 3 7 4 3 7 0 2 0 3 7 0 2\n2 3 0 0 2 3 0 7 0 7 3 7 0 4 0 3 7\n2 0 2 2 7 2 0 0 2 2 3 0 0 3 7 0 3\n7 2 4 0 3 0 0 2 2 7 4 0 0 2 2 0 4\n0 0 3 0 4 4 7 7 4 2 0 0 3 7 0 2 0\n2 3 4 0 3 0 3 3 2 3 4 7 7 0 2 0 3\n\nOutput:\n2 3 2 8 4 4 0 2 3 0 2 4 7 7 3 7 3\n3 4 8 8 8 0 0 2 0 2 0 2 7 7 7 8 7\n7 3 0 8 0 2 2 0 2 2 0 7 3 0 8 8 8\n2 0 2 0 2 0 3 2 0 7 0 7 0 0 2 8 0\n7 7 4 3 7 2 0 2 3 0 3 4 7 2 0 3 7\n2 4 0 7 0 0 3 4 4 0 3 4 4 8 3 4 0\n3 2 7 3 7 3 7 2 0 2 3 2 8 8 8 4 4\n3 7 4 0 2 0 2 0 3 7 2 3 3 8 3 0 2\n3 2 3 2 0 2 0 2 0 7 2 0 2 4 4 7 3\n4 3 4 2 0 7 0 0 7 0 0 0 0 3 0 0 3\n2 3 0 0 4 0 2 0 3 3 2 0 4 0 0 2 2\n3 3 4 3 2 7 2 4 3 0 7 3 3 4 2 0 3\n2 0 7 7 0 3 7 4 3 7 0 2 0 3 7 0 2\n2 3 0 0 2 3 0 7 0 7 3 7 0 4 0 3 7\n2 0 2 2 7 2 0 0 2 2 3 0 0 3 7 0 3\n7 2 4 0 3 0 0 2 2 7 4 0 0 2 2 0 4\n0 0 3 0 4 4 7 7 4 2 0 0 3 7 0 2 0\n2 3 4 0 3 0 3 3 2 3 4 7 7 0 2 0 3\n\nTest Input:\n7 3 2 2 4 3 7 2 7 0 7 3 4 0 3 2 4\n0 2 2 2 2 3 0 3 3 0 3 2 0 0 3 0 7\n3 2 0 3 7 0 2 2 2 3 7 0 3 3 0 2 2\n4 2 7 7 0 0 2 0 0 0 7 4 3 2 3 7 2\n7 0 8 3 0 7 3 3 0 2 3 0 4 0 0 7 0\n3 4 8 8 3 2 0 0 3 4 2 4 0 3 3 2 4\n2 3 0 8 0 0 2 4 0 4 4 0 0 7 2 3 0\n2 4 0 3 0 0 2 2 3 2 7 3 3 7 0 4 0\n2 7 7 4 0 3 0 2 7 7 0 4 7 0 7 3 3\n0 0 7 3 4 0 2 3 0 7 4 3 2 3 0 7 3\n2 7 0 3 4 7 3 4 0 4 0 0 0 3 3 7 2\n4 3 0 2 3 0 4 0 4 3 3 2 2 3 3 0 3\n4 7 0 7 3 3 
2 3 3 0 7 0 0 0 0 4 7\n3 3 3 3 0 4 3 4 4 7 3 7 0 0 0 3 0\n0 2 2 3 3 3 0 7 3 2 7 3 4 3 3 3 3\n3 3 3 4 7 4 3 3 3 0 0 4 0 7 0 4 3\n\nGive your answer in ... tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 7, + 3, + 2, + 2, + 4, + 3, + 7, + 2, + 7, + 0, + 7, + 3, + 4, + 0, + 3, + 2, + 4 + ], + [ + 0, + 2, + 2, + 2, + 2, + 3, + 0, + 3, + 3, + 0, + 3, + 2, + 0, + 0, + 3, + 0, + 7 + ], + [ + 3, + 2, + 0, + 3, + 7, + 0, + 2, + 2, + 2, + 3, + 7, + 0, + 3, + 3, + 0, + 2, + 2 + ], + [ + 4, + 2, + 7, + 7, + 0, + 0, + 2, + 0, + 0, + 0, + 7, + 4, + 3, + 2, + 3, + 7, + 2 + ], + [ + 7, + 0, + 8, + 3, + 0, + 7, + 3, + 3, + 0, + 2, + 3, + 0, + 4, + 0, + 0, + 7, + 0 + ], + [ + 3, + 4, + 8, + 8, + 3, + 2, + 0, + 0, + 3, + 4, + 2, + 4, + 0, + 3, + 3, + 2, + 4 + ], + [ + 2, + 3, + 0, + 8, + 0, + 0, + 2, + 4, + 0, + 4, + 4, + 0, + 0, + 7, + 2, + 3, + 0 + ], + [ + 2, + 4, + 0, + 3, + 0, + 0, + 2, + 2, + 3, + 2, + 7, + 3, + 3, + 7, + 0, + 4, + 0 + ], + [ + 2, + 7, + 7, + 4, + 0, + 3, + 0, + 2, + 7, + 7, + 0, + 4, + 7, + 0, + 7, + 3, + 3 + ], + [ + 0, + 0, + 7, + 3, + 4, + 0, + 2, + 3, + 0, + 7, + 4, + 3, + 2, + 8, + 0, + 7, + 3 + ], + [ + 2, + 7, + 0, + 3, + 4, + 7, + 3, + 4, + 0, + 4, + 0, + 0, + 0, + 8, + 8, + 7, + 2 + ], + [ + 4, + 3, + 0, + 2, + 3, + 0, + 4, + 0, + 4, + 3, + 3, + 2, + 2, + 3, + 8, + 0, + 3 + ], + [ + 4, + 7, + 0, + 7, + 3, + 3, + 2, + 3, + 3, + 0, + 7, + 0, + 0, + 0, + 0, + 4, + 7 + ], + [ + 3, + 3, + 8, + 8, + 0, + 4, + 3, + 4, + 4, + 7, + 3, + 7, + 0, + 0, + 0, + 8, + 0 + ], + [ + 0, + 2, + 2, + 8, + 8, + 3, + 0, + 7, + 3, + 2, + 7, + 3, + 4, + 3, + 3, + 8, + 8 + ], + [ + 3, + 3, + 3, + 4, + 7, + 4, + 3, + 3, + 3, + 0, + 0, + 4, + 0, + 7, + 0, + 4, + 8 + ] + ] + ], + "num_test_pairs": 1, + "topic": "arc", + "source": "ARC1-Eval" + }, + { + "problem_id": "arc2_62593bfd", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 3 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 3 3 3 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n4 4 0 0 0 2 
2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 3 5 5 5 5 5\n5 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 7 5 5 9 9 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 7 7 5 5 9 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 2 5 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 4 4 4 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 
5 5\n\nOutput:\n5 5 5 5 2 2 2 5 5 5 5 5 5 7 5 5 9 9 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 2 5 2 2 5 5 5 5 7 7 5 5 9 5 5 5 5 5 3 5 3 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 4 4 4 5 5 5 5 5 5 5\n\nTest Input 1:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 
1 1 1 1 1 1 1 1\n1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 1 1 1 1\n1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 5 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 5 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 1 1 5 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 3 1 1 1 3 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1 1\n1 1 1 1 1 3 3 3 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1 1\n1 1 1 1 1 3 1 3 1 1 1 1 1 1 1 1 1 1 3 3 3 1 1 1 1\n1 1 1 1 1 3 3 3 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1\n1 1 1 1 3 1 1 1 3 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 3 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 3 9 3 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 4 4 4 9 9 9 9 9 3 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 9 9 9 9 9 4 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 1 1 1 1 9 9 9 9 9 9 9 9 4 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 7 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 6 6 6 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 
9 9 9 9 9\n9 9 8 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 8 8 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ 
+ 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 5, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 3, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 5, + 5, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 1, + 1, + 5, + 1 + ] + ], + [ + [ + 9, + 9, + 8, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 7, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 8, + 8, + 9, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, 
+ 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 6, + 6, + 6, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 
9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 4, + 4, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 3, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 9, + 9 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_2b83f449", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n3 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 7 7 7 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 7 7 7 0 0 0 0 7 7 7 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 7 7 7 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 7 7 7 0 0 0 7 7 7 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 0 8 8 3\n0 0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 7 7 7 0 0 0 0 0 7 7 7 0 0 0 0\n8 8 0 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 6 8 8 0 8 8 6 8 8 8 8 8 8 8 8\n0 0 0 8 6 8 0 0 0 8 6 8 0 0 0 0 0 0 0\n3 3 8 8 6 8 6 8 8 8 6 8 8 6 8 8 8 8 8\n0 0 0 0 0 8 6 8 0 0 0 0 8 6 8 0 0 0 0\n8 8 8 6 8 8 6 8 6 8 8 8 8 6 8 6 8 8 8\n0 0 8 6 8 0 0 8 6 8 0 0 0 0 8 6 8 0 0\n3 3 8 6 8 6 8 8 6 8 8 6 8 8 8 6 8 3 3\n0 0 0 0 8 6 8 0 0 0 8 6 8 0 0 0 0 0 0\n3 8 8 8 8 6 8 8 6 8 8 6 8 8 3 0 8 8 3\n0 0 0 0 0 0 0 8 6 8 0 0 0 0 0 0 0 0 0\n8 8 8 8 8 6 8 8 6 8 8 8 8 6 8 8 8 8 8\n0 0 0 0 8 6 8 0 0 0 0 0 8 6 8 0 0 0 0\n8 8 0 3 8 6 8 8 0 3 8 8 8 6 8 8 8 8 3\n\nTraining Example 2:\nInput:\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 7 7 7 0 0 0 0 
0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 0 0 0 7 7 7 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 6 8 8 8 8 8 8 8 8 8 8 8\n0 0 0 8 6 8 0 0 0 0 0 0 0 0 0 0\n3 3 8 8 6 8 8 8 8 8 8 8 6 8 8 8\n0 0 0 0 0 0 0 0 0 0 0 8 6 8 0 0\n8 8 8 8 8 8 6 8 8 8 8 8 6 8 3 3\n0 0 0 0 0 8 6 8 0 0 0 0 0 0 0 0\n8 8 8 6 8 8 6 8 8 8 8 6 8 8 8 8\n0 0 8 6 8 0 0 0 0 0 8 6 8 0 0 0\n3 3 8 6 8 8 8 6 8 8 8 6 8 8 3 3\n0 0 0 0 0 0 8 6 8 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 6 8 8 8 8 8 8 8 3\n\nTest Input:\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 7 7 7 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 0 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 7 7 7 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 0 0 0 0 7 7 7 0 0 0\n8 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0 + ], + [ + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 3, + 8, + 8, + 8, + 8, + 6, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 3, + 0, + 8, + 8, + 8, + 8, + 8, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0 + ], + [ + 3, + 8, + 8, + 6, + 8, + 8, + 3, + 0, + 3, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 3 + ] + ] + ], + "num_test_pairs": 1, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_88bcf3b4", + "problem_text": "ARC Puzzle: Predict the 
output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0\n0 0 0 0 0 2 0\n0 0 0 0 0 0 0\n0 0 0 4 4 8 0\n0 0 0 4 0 8 0\n0 0 4 4 0 8 0\n0 4 0 0 0 8 0\n\nOutput:\n0 0 0 0 0 4 0\n0 0 0 0 4 2 0\n0 0 0 0 4 0 0\n0 0 0 0 4 8 0\n0 0 0 0 0 8 0\n0 0 0 0 0 8 0\n0 0 0 0 0 8 0\n\nTraining Example 2:\nInput:\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 7 7 3 2 7 7 7 7\n7 7 7 7 7 3 7 2 7 7 7 7\n7 7 7 7 7 3 7 2 7 7 7 7\n7 7 7 3 3 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n\nOutput:\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 3 4 7 7 7 7 7 7 7\n7 7 7 3 4 7 7 7 7 7 7 7\n7 7 7 7 3 7 7 7 7 7 7 7\n7 7 7 7 7 3 7 7 7 7 7 7\n7 7 7 7 7 7 3 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n\nTraining Example 3:\nInput:\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 7 7 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 7 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 7 7 1 1 1 1\n1 1 1 1 1 1 2 1 7 7 7 1 1 1 1 1 1\n1 1 1 1 1 1 2 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 
1 1 1 1 1 1 1 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 4:\nInput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0 0\n0 0 3 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 8 0 5 0 0 0 0 0\n0 0 8 0 5 0 0 0 0 0\n0 8 8 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n\nOutput:\n0 0 0 8 0 0 0 0 0 0\n0 0 8 3 0 0 0 0 0 0\n0 8 3 0 0 0 0 0 0 0\n0 0 8 3 0 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n\nTraining Example 5:\nInput:\n0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0\n0 0 0 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0\n0 0 0 0 9 6 0 0 0\n0 0 0 9 0 6 0 0 0\n9 9 9 0 0 6 0 0 0\n9 0 0 0 0 6 0 0 0\n\nOutput:\n0 0 0 0 9 0 0 0 0\n0 0 0 9 0 0 0 0 0\n0 0 9 3 0 0 0 0 0\n0 0 9 3 0 0 0 0 0\n0 0 0 9 0 0 0 0 0\n0 0 0 0 9 6 0 0 0\n0 0 0 0 0 6 0 0 0\n0 0 0 0 0 6 0 0 0\n0 0 0 0 0 6 0 0 0\n\nTest Input 1:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 9 9 5 5 5 5 5 5 5 5 5 5\n5 5 5 8 5 5 5 5 5 5 9 9 9 5 5 5 5 5 5 5 5 5\n5 5 5 5 8 5 5 5 5 5 9 9 9 9 5 5 5 5 5 5 5 5\n5 5 5 5 5 8 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n3 3 3 3 3 3 3 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 4 4 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 4 4 4 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 4 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 1 5 
5 5 5 5 5 5 5 5 5 5 5 5\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 1 1 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 1 1 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 1 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 2 2 2 2\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 8 5 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 5 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 5 8 8 8\n8 8 8 8 5 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 5 8 8\n8 8 8 8 5 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 4 4 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 4 4 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 
5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 9, + 9, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 9, + 9, + 9, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 5, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, 
+ 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, 
+ 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 6, + 6, + 8, + 8, + 5, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 6, + 6, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 4, + 5, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 4, + 5, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 4, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 
8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_8b7bacbf", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 5 0\n2 0 0 2 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 5 0 0 5 0\n2 0 0 2 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 5 5 1 0\n0 2 2 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 1 0 0 0 1 0\n0 0 0 0 1 1 1 1 1 2 2 1 0 0 0 0 2 0 2 2 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 2 0 0 0 0 2 0 1 0\n0 0 0 0 0 0 1 1 1 1 1 0 0 0 0 0 2 0 0 2 2 0 1 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 2 2 0 0 0 1 0\n0 0 0 1 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 0 0 3 0 0 0 2 2 1 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 0 0 3 0 0 2 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 1 0 0 1 3 3 1 1 1 2 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 1 1 1 0 0 0 0 0 2 0 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 7\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 7 7 5 0\n2 0 0 2 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 5 7 7 5 0\n2 0 0 2 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 5 5 1 0\n0 2 2 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 1 0 0 0 1 0\n0 0 0 0 1 1 1 1 1 2 2 1 0 0 0 0 2 7 2 2 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 2 7 7 7 7 2 0 1 0\n0 0 0 0 0 0 1 1 1 1 1 0 0 0 0 0 2 7 7 2 2 0 1 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 2 2 0 0 0 1 0\n0 0 0 1 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 7 7 3 0 0 0 2 2 1 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 7 7 3 0 0 2 7 7 2 0 0 0 0 0 0 1 0\n0 0 0 1 0 0 1 3 3 1 1 1 2 7 7 2 0 0 0 0 0 0 1 0\n0 0 0 1 1 1 0 0 0 0 0 2 7 7 7 2 
0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 2 7 7 2 0 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 7\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 2 2 0 0\n0 0 0 2 2 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n0 0 2 0 0 2 2 0 0 2 0 0 2 2 0 2 0 0 2 0\n0 0 2 0 0 2 1 2 2 0 0 2 0 0 2 0 2 2 1 0\n0 0 0 2 2 1 1 1 0 0 0 2 0 0 2 0 0 1 0 0\n0 0 0 1 0 0 0 0 1 1 0 0 2 2 0 0 1 0 0 0\n0 0 0 1 0 0 0 0 0 1 1 0 0 0 0 1 0 0 0 0\n0 0 1 1 0 0 0 0 0 0 1 1 0 0 1 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 1 1 1 0 0 0 2 2 0\n1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n4 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 2 2 0 0\n0 0 0 2 2 0 2 4 4 2 0 0 0 0 0 2 4 4 2 0\n0 0 2 4 4 2 2 4 4 2 0 0 2 2 0 2 4 4 2 0\n0 0 2 4 4 2 1 2 2 0 0 2 0 0 2 0 2 2 1 0\n0 0 0 2 2 1 1 1 0 0 0 2 0 0 2 0 0 1 0 0\n0 0 0 1 0 0 0 0 1 1 0 0 2 2 0 0 1 0 0 0\n0 0 0 1 0 0 0 0 0 1 1 0 0 0 0 1 0 0 0 0\n0 0 1 1 0 0 0 0 0 0 1 1 0 0 1 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 1 1 1 0 0 0 2 2 0\n1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n4 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2\n0 0 2 2 0 0 0 0 0 0 0 2 2 0 0 0 0 2 0 0\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 2 0 0\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 3 2 2\n0 1 2 2 1 1 1 1 1 1 1 2 2 1 0 0 0 3 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 3 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 3 0\n1 1 0 0 0 0 0 2 2 1 1 1 0 0 0 0 2 2 3 0\n0 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n1 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n0 0 0 0 0 0 1 2 2 0 0 0 0 0 0 3 2 2 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 3 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 3 3 2 2 3 0 0 0 0\n0 0 2 2 1 0 0 0 0 0 3 0 2 0 0 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 3 3 0 2 0 0 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 4 3 0 0 2 2 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2\n0 0 2 2 0 0 0 0 0 0 0 2 2 0 0 0 0 2 4 4\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 
0 0 2 4 4\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 3 2 2\n0 1 2 2 1 1 1 1 1 1 1 2 2 1 0 0 0 3 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 3 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 3 0\n1 1 0 0 0 0 0 2 2 1 1 1 0 0 0 0 2 2 3 0\n0 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 4 4 2 0\n1 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 4 4 2 0\n0 0 0 0 0 0 1 2 2 0 0 0 0 0 0 3 2 2 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 3 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 3 3 2 2 3 0 0 0 0\n0 0 2 2 1 0 0 0 0 0 3 0 2 4 4 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 3 3 0 2 4 4 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 4 3 0 0 2 2 0 0 0 0 0\n\nTraining Example 4:\nInput:\n0 0 2 2 0 0 0 0\n0 2 0 0 2 0 0 0\n0 2 0 0 2 0 0 0\n0 0 2 2 0 1 0 0\n0 0 0 0 0 0 1 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 0 1 1\n0 0 0 0 0 0 1 4\n\nOutput:\n0 0 2 2 0 0 0 0\n0 2 4 4 2 0 0 0\n0 2 4 4 2 0 0 0\n0 0 2 2 0 1 0 0\n0 0 0 0 0 0 1 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 0 1 1\n0 0 0 0 0 0 1 4\n\nTest Input 1:\n6 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8\n1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3\n5 5 5 1 9 9 1 1 1 1 1 1 1 9 9 9 9 9 9 9 5 5 5 5 5 5 3 3 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 5 5 3 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 5 3 3 5 5 5\n5 5 5 5 9 9 5 5 5 5 5 5 5 9 9 9 9 9 9 9 1 1 1 1 5 3 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 1 3 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 1 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 1 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 9 3 5 5 1 5 5\n5 5 5 5 9 9 9 9 9 9 9 5 5 5 5 5 9 3 3 5 5 9 5 5 9 5 5 1 5 5\n5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 9 9 9 3 3 3 9 5 5 9 5 5 1 5 5\n5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 9 5 9 5 5 3 3 9 9 5 5 5 1 1 5\n5 5 3 3 9 9 9 9 9 9 9 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 5 1 5\n5 0 3 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 5 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 5 5\n5 5 0 5 5 5 5 5 5 5 5 5 5 
5 5 9 5 9 5 5 5 5 5 5 5 5 1 1 5 5\n5 5 3 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 1 5 5 5\n5 5 3 5 5 5 5 5 5 5 5 5 5 3 3 3 9 5 5 5 5 5 5 5 5 1 1 5 5 5\n5 5 3 3 5 5 5 5 5 5 3 3 3 3 5 5 5 5 5 5 9 9 9 1 1 1 5 5 5 5\n5 5 5 3 9 9 3 3 3 3 3 5 5 5 5 5 5 5 5 9 5 5 9 1 1 5 5 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5\n5 5 5 5 9 9 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 9 9 9 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n\nTest Input 2:\n0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 8 8 0\n0 0 0 0 0 0 0 1 1 0 0 0 0 0 1 1 1 0 0 0 0 0 8 0 0 8\n0 0 0 0 2 2 1 1 0 0 0 0 0 0 0 0 1 1 8 8 0 0 8 0 0 8\n0 0 0 2 0 0 2 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 8 8 0\n0 0 0 2 0 0 2 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 0 0 0\n0 0 0 1 2 2 1 0 0 0 0 0 0 0 0 0 0 0 8 8 1 0 0 0 0 0\n0 0 1 1 0 0 1 1 6 6 6 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 0 8 8 0 0 0 0 0 0 0 1 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 8 0 0 8 0 0 0 5 5 5 1 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 8 0 0 8 0 0 5 0 0 0 5 0\n0 0 1 0 0 0 0 0 6 6 6 0 0 9 9 8 8 9 0 0 5 0 0 0 5 0\n0 0 1 0 0 0 0 0 0 0 0 0 9 0 0 0 0 9 9 0 0 5 5 5 0 0\n0 0 1 0 0 0 0 0 8 8 9 9 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 8 0 0 8 0 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 8 0 0 8 0 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 0 8 8 0 0 0 0 0 0 0 0 9 0 0 0 8 8 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 9 0 0 8 0 0 8 0\n0 1 1 0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 8 0 0 8 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 9 8 8 0 0\n0 1 0 0 0 0 0 9 9 9 9 0 0 0 0 9 8 8 9 9 9 0 0 0 0 0\n1 1 0 0 9 9 9 0 0 0 9 9 9 9 9 9 0 0 0 0 0 0 0 0 0 0\n4 1 0 0 9 3 9 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated 
values, one row per line.", + "ground_truth": [ + [ + [ + 6, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 8 + ], + [ + 1, + 1, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3 + ], + [ + 5, + 5, + 5, + 1, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 3, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 3, + 3, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 1, + 1, + 1, + 5, + 3, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 3, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 3, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 3, + 3, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 9, + 9, + 9, + 3, + 3, + 3, + 9, + 8, + 8, + 9, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 5, + 5, + 
5, + 5, + 9, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 3, + 3, + 9, + 9, + 5, + 5, + 5, + 1, + 1, + 5 + ], + [ + 5, + 5, + 3, + 3, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5 + ], + [ + 5, + 0, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 0, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5, + 5 + ], + [ + 5, + 5, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 3, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 1, + 1, + 1, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 1, + 1, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + 
], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ] + ], + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 0, + 0, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 8 + ], + [ + 0, + 0, + 0, + 2, + 4, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 8, + 8, + 0 + ], + [ + 0, + 0, + 0, + 2, + 4, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 1, + 2, + 2, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 0, + 0, + 1, + 1, + 6, + 6, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 8, + 3, + 3, + 8, 
+ 0, + 0, + 0, + 5, + 5, + 5, + 1, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 9, + 9, + 8, + 8, + 9, + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 0, + 0, + 5, + 5, + 5, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 9, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 8, + 8, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 9, + 0, + 0, + 8, + 3, + 3, + 8, + 0 + ], + [ + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 3, + 3, + 8, + 0 + ], + [ + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 9, + 8, + 8, + 0, + 0 + ], + [ + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 8, + 8, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 0, + 0, + 9, + 9, + 9, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 4, + 1, + 0, + 0, + 9, + 3, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_faa9f03d", + "problem_text": "ARC Puzzle: Predict the 
test output grid.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 3 0 0\n1 1 1 1 0 0 0 0 0 3 0 0\n0 0 0 1 0 0 0 0 0 3 0 0\n2 3 3 3 2 0 0 0 0 3 0 0\n0 0 0 1 3 0 0 0 0 3 0 0\n0 0 0 1 3 1 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 2 3 3 3 0 2 0 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 1 1 0 1 1 0\n0 0 0 0 0 0 0 0 0 0 1 1\n\nOutput:\n0 0 0 0 0 0 0 0 0 3 0 0\n1 1 1 1 0 0 0 0 0 3 0 0\n0 0 0 1 0 0 0 0 0 3 0 0\n3 3 3 1 3 0 0 0 0 3 0 0\n0 0 0 1 3 0 0 0 0 3 0 0\n0 0 0 1 1 1 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 3 1 3 3 3 0 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 1 1 1 1 1 0\n0 0 0 0 0 0 0 0 0 0 1 1\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 7 0\n7 7 7 7 0 0 0 0 0 0 7 0\n3 3 3 3 3 0 3 3 3 4 7 0\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 0 0 0 0 0 0 0 7 0\n0 0 0 7 7 7 7 0 3 0 0 0\n0 0 0 0 0 0 7 0 3 0 7 0\n0 0 7 7 7 7 7 0 3 0 7 0\n0 0 7 0 0 0 0 0 3 0 7 0\n3 3 0 3 3 3 3 3 3 0 7 0\n0 0 7 7 7 7 7 7 7 7 7 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 7 0\n7 7 7 7 0 0 0 0 0 0 7 0\n0 0 0 7 0 0 0 0 3 3 3 3\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 7 7 7 7 0 3 0 7 0\n0 0 0 0 0 0 7 0 3 0 7 0\n0 0 7 7 7 7 7 0 3 0 7 0\n0 0 7 0 0 0 0 0 3 0 7 0\n3 3 3 3 3 3 3 3 3 0 7 0\n0 0 7 7 7 7 7 7 7 7 7 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n0 0 7 0 3 0 6 0 0 2 0 0\n0 0 7 0 0 0 0 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n3 3 7 3 2 0 6 0 0 1 0 0\n0 0 7 0 0 0 6 0 6 1 6 6\n0 0 7 0 0 0 0 0 0 1 0 0\n7 0 7 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0\n0 0 0 0 2 1 1 1 1 2 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n\nOutput:\n0 0 7 0 3 0 6 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n3 3 3 3 3 0 6 0 0 1 0 0\n0 0 7 0 0 0 6 6 6 6 6 6\n0 0 7 0 0 0 0 0 0 1 0 0\n7 7 7 0 0 0 0 0 0 1 0 0\n0 0 0 0 0 0 0 0 0 1 0 0\n0 0 0 0 1 1 1 1 1 1 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n\nTraining Example 4:\nInput:\n0 1 0 0 0 0 1 0 0 0 6 
0\n0 1 0 0 0 0 1 0 0 0 6 0\n6 1 6 6 6 6 0 6 0 6 6 0\n0 1 0 0 0 0 1 0 0 0 4 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 1 1 1 0 1 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 1 0 0 0 0 1 0 0 0 0 0\n0 1 0 0 0 0 1 0 0 0 0 0\n6 1 6 6 6 6 1 6 6 6 6 0\n0 1 0 0 0 0 1 0 0 0 6 0\n0 1 0 0 0 0 1 0 0 0 6 0\n0 1 1 1 1 1 1 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n\nTest Input:\n0 0 0 0 7 0 0 0 0 0 7 0\n0 0 0 0 7 0 0 0 0 0 7 0\n0 0 0 0 7 0 0 0 0 0 7 0\n4 2 7 7 2 0 0 2 7 7 2 0\n0 7 0 0 0 0 0 7 0 0 4 0\n0 7 0 0 0 0 0 7 0 0 0 0\n0 7 0 0 0 0 0 7 0 0 0 0\n6 6 6 6 6 6 6 0 6 6 6 6\n0 7 0 0 0 0 0 7 0 0 0 0\n0 2 7 7 7 7 7 2 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nGive your answer in ... tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 6, + 7, + 6, + 6, + 6, + 6, + 6, + 7, + 6, + 6, + 7, + 6 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ] + ] + ], + "num_test_pairs": 1, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_269e22fb", + "problem_text": "ARC Puzzle: Predict the output grid for each 
of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 7 8 8 8 8 8 8 8 8\n7 7 7 7 7 7 8 8 8 8\n7 7 7 7 7 7 7 8 8 8\n7 7 8 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 8\n8 8 8 8 8 8 8 7 7 7\n8 8 8 8 8 8 8 8 7 7\n8 8 8 8 8 8 8 8 8 7\n\nOutput:\n7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7 8 8 8\n7 7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 7 8 8 8\n7 7 7 7 7 7 7 8 8 8 8 8 8 8 8 7 7 7 8 8\n7 7 8 8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 8 8 8 8 8 7 7 7 7 7 8\n8 8 8 8 8 8 8 7 7 7 8 8 8 8 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 7 7 8 8 7 7 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 8 7 8 8 7 8 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 8 7 7 7 7 8 7 8 8 7 7 8\n8 7 7 7 7 7 7 7 7 7 8 7 7 8 7 8 8 7 7 8\n8 7 8 8 8 8 8 8 8 7 7 7 7 8 7 8 8 7 7 8\n8 7 7 7 7 7 7 7 7 7 8 8 7 8 7 8 8 7 7 8\n8 7 8 7 8 8 8 8 8 7 8 8 7 7 7 8 8 7 7 8\n7 7 7 8 7 7 7 7 7 7 8 8 8 8 7 8 8 7 7 8\n8 7 8 7 7 8 8 8 8 7 8 8 8 8 7 7 7 7 7 8\n7 7 7 8 7 8 8 8 8 7 8 8 8 7 7 8 7 7 8 8\n8 7 8 7 7 8 8 8 8 7 8 8 8 7 8 8 8 7 7 8\n7 7 7 8 7 8 8 8 8 7 8 8 8 7 7 8 8 8 7 7\n8 7 8 7 7 8 8 8 7 8 7 8 8 8 7 8 7 7 7 8\n7 7 7 8 8 8 8 7 8 8 8 7 8 8 7 7 7 8 8 8\n\nTraining Example 2:\nInput:\n8 8 7 8 8 8 7 8\n8 8 8 7 8 7 8 8\n7 8 8 8 7 8 8 8\n7 8 8 8 7 8 8 8\n7 8 8 8 7 8 8 8\n8 8 8 8 7 8 8 8\n8 8 8 8 7 7 7 7\n7 7 8 8 7 8 8 8\n8 7 8 8 7 7 7 7\n8 7 7 7 7 8 8 8\n8 7 7 8 7 7 7 7\n8 7 7 7 7 8 8 8\n8 7 8 8 7 8 8 8\n7 7 8 8 7 7 8 8\n8 8 8 8 7 7 7 8\n8 8 8 8 8 7 7 7\n\nOutput:\n8 8 8 7 7 7 8 8 7 8 8 8 7 8 8 8 8 7 7 7\n8 7 7 7 8 7 8 8 8 7 8 7 8 8 8 7 7 8 7 8\n7 7 8 8 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 8 8 8 7 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 8 7 7 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 7 7 7 8 7 7 7\n8 7 7 8 8 7 7 7 8 8 7 8 8 8 8 8 7 8 7 8\n8 7 7 8 8 7 8 7 8 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 7 8\n8 7 7 8 8 7 8 7 7 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 8 8 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 7 7 8 8 7 7 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 7 7 7 8 8 8 
8 8 7 7 7 8 8 8 8 8 8\n8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8 8 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 8 7 7 7 7 7 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 7 7 7 7 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 3 3 3 3 3\n0 0 3 3 3 3 3 3 3 3\n3 3 3 3 3 0 0 0 0 0\n3 3 3 3 3 0 0 0 0 0\n0 0 0 0 3 3 3 3 3 3\n0 0 0 0 0 0 3 0 0 0\n0 0 0 0 0 0 3 3 3 3\n0 0 0 0 0 0 0 0 3 3\n0 0 0 0 0 0 0 0 3 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 0 0\n0 0 0 0 3 3 3 3 3 3 3 3 3 3 3 0 3 3 3 0\n0 0 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 0 3 0\n3 3 3 3 3 0 0 0 0 0 0 0 0 0 3 3 0 0 3 3\n3 3 3 3 3 0 0 0 0 0 0 0 0 0 3 0 0 0 0 3\n0 0 0 0 3 3 3 3 3 3 3 3 3 3 3 3 0 3 3 3\n0 0 0 0 0 0 3 0 0 0 0 0 3 0 0 3 3 3 0 0\n0 0 0 0 0 0 3 3 3 3 3 3 3 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 3 3 3 0 0 0 0 0 0 0 0 3\n0 0 0 0 0 0 0 0 3 0 3 0 0 0 0 0 0 0 3 0\n0 0 0 0 0 3 3 3 3 3 3 3 3 3 3 3 3 3 0 0\n0 0 0 0 3 3 3 0 0 3 0 3 0 3 0 0 0 0 3 0\n0 0 0 3 3 3 0 0 0 3 0 3 0 3 0 0 0 0 0 3\n0 0 3 3 3 0 0 0 0 3 0 3 0 3 0 0 0 0 0 0\n0 3 3 3 0 0 0 0 0 3 0 3 0 3 0 0 0 0 0 0\n0 3 3 0 0 0 0 0 0 3 0 3 0 3 3 3 3 3 3 0\n0 3 3 0 0 0 0 0 0 3 0 3 3 0 3 0 3 0 3 0\n0 3 3 0 0 0 0 0 0 3 0 3 0 3 0 3 0 3 0 3\n3 3 3 3 0 0 0 0 0 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 0 0 0 0 0 0 0 0 0 3 0 3 0 3 0 3\n\nTraining Example 4:\nInput:\n8 8 7 7 7 8 8 8 8 8 8 8\n8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 7 7 7 8 8 8 8 8 7\n8 7 7 8 8 7 8 8 8 8 7 7\n8 7 7 8 8 7 7 7 8 8 7 7\n8 7 7 8 8 7 8 7 8 8 7 8\n8 7 7 8 8 7 8 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 8 7 7\n8 7 7 8 8 7 8 7 7 7 7 8\n8 7 7 8 8 7 8 7 8 8 7 7\n8 7 7 8 8 7 7 7 8 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7\n8 7 7 7 7 7 8 8 8 8 7 8\n\nOutput:\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 7 7 7 7 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 8 7 7 7 7 7 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8 8 7 7\n8 7 7 7 7 7 8 8 8 8 8 7 7 7 8 8 8 8 8 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 8 8 7 7 7 8 8 7 7 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 8 8 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 8 8\n8 7 
7 8 8 7 8 7 7 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 7 8\n8 7 7 8 8 7 8 7 8 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 7 7 8 8 7 8 8 8 8 8 7 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 7 7 7 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 8 7 7 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 8 8 8 7 8 8 8 7 8 8 8 8 7 7 8 7 8\n7 7 8 8 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 7 8 7 8 8 8 7 8 7 8 8 8 7 7 8 7 8\n8 8 8 7 7 7 8 8 7 8 8 8 7 8 8 8 8 7 7 7\n\nTraining Example 5:\nInput:\n8 7 8 7 8 8 8 8 8 7\n8 7 8 7 8 8 8 8 8 8\n8 7 8 7 8 8 8 8 8 8\n8 7 8 7 7 7 7 7 7 8\n8 7 7 8 7 8 7 8 7 8\n8 7 8 7 8 7 8 7 8 7\n7 7 7 7 7 7 7 7 7 7\n8 8 8 7 8 7 8 7 8 7\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 7 8 8\n8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 7 7 7 8\n8 8 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 8 7 8\n7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 7 8 8 7 7\n7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 8 8 8 8 7\n8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 7 8 7 7 7\n8 8 8 8 8 8 7 8 8 8 8 8 7 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 7 7 7 7 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 7 7 7 8 8 8 8 8 8 8 8 7\n8 8 8 8 8 8 8 8 7 8 7 8 8 8 8 8 8 8 7 8\n8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 7 7 7 8 8 7 8 7 8 7 8 8 8 8 7 8\n8 8 8 7 7 7 8 8 8 7 8 7 8 7 8 8 8 8 8 7\n8 8 7 7 7 8 8 8 8 7 8 7 8 7 8 8 8 8 8 8\n8 7 7 7 8 8 8 8 8 7 8 7 8 7 8 8 8 8 8 8\n8 7 7 8 8 8 8 8 8 7 8 7 8 7 7 7 7 7 7 8\n8 7 7 8 8 8 8 8 8 7 8 7 7 8 7 8 7 8 7 8\n8 7 7 8 8 8 8 8 8 7 8 7 8 7 8 7 8 7 8 7\n7 7 7 7 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 8 8 8 8 8 8 8 8 8 7 8 7 8 7 8 7\n\nTest Input 1:\n8 7 8 7 8 7 8 7 7 7\n8 8 8 8 8 8 8 8 8 8\n8 7 8 7 8 7 8 7 8 7\n7 8 7 8 7 8 7 8 8 7\n7 8 8 8 8 8 8 7 8 7\n7 7 7 7 7 7 8 7 8 7\n7 7 7 7 7 7 8 7 8 7\n8 7 7 7 7 7 8 7 8 7\n7 8 7 7 7 7 8 7 8 7\n7 7 8 8 8 8 8 8 8 8\n\nTest Input 2:\n6 6 6 6 6 5 5 5 5 5\n5 5 5 5 5 5 6 6 6 6\n6 6 6 5 6 6 6 6 6 6\n5 5 5 5 6 6 6 6 6 6\n5 5 6 6 6 6 6 6 6 6\n6 5 6 6 6 6 6 6 6 6\n5 5 5 5 5 6 6 6 6 6\n5 6 6 5 5 5 6 6 6 6\n5 6 6 6 5 5 5 6 6 6\n5 6 6 6 6 5 5 5 6 6\n5 6 6 6 6 6 5 5 5 6\n\nFor each test input, give your answer in a 
numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8 + ], + [ + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 7 + ], + [ + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 7 + ], + [ + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7 + ], + [ + 7, + 8, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 7, + 7, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 7, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7 + ], + [ + 7, + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ] + ], + [ + [ + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 5, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6 + ], + [ + 5, + 5, + 6, + 6, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 6, + 6, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, 
+ 5, + 6 + ], + [ + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 6 + ], + [ + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 6 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5 + ], + [ + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_4e34c42c", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 1 8 8 2 8 2 3 3 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 4 1 1 1 2 2 2 3 2 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 1 8 8 2 8 2 3 3 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 8 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 4 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 8 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n6 8 9 8 8 8 8 8 8 8 8 8\n6 1 1 1 8 8 2 8 2 3 3 3\n6 1 4 1 1 1 2 2 2 3 2 3\n6 1 1 1 8 8 2 8 2 3 3 3\n6 8 9 8 8 8 8 8 8 8 8 8\n\nTraining 
Example 2:\nInput:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 8 1 1 1 3 3 1 4 4 4\n4 1 1 1 4 4 4 4 4 4 8 4 4 1 4 4 1 4 4 4\n4 1 2 1 4 4 4 4 4 4 8 1 1 1 3 3 1 4 4 4\n4 1 1 1 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 1 1 1 4 4 4 4 4 4 4 5 3 5 4 4\n4 4 4 4 4 1 2 1 3 3 3 3 3 3 3 3 5 3 4 4\n4 4 4 4 4 1 1 1 4 4 4 4 4 4 4 5 3 5 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 5 3 5 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 3 5 3 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 5 3 5 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nOutput:\n4 4 4 4 4 4 4 4 4 4 4 6 6 6 4 4 4 4 1 1 1 1\n1 1 1 4 4 4 4 4 4 4 5 3 5 6 6 8 1 1 1 3 3 1\n1 2 1 3 3 3 3 3 3 3 3 5 3 6 6 8 4 4 1 4 4 1\n1 1 1 4 4 4 4 4 4 4 5 3 5 6 6 8 1 1 1 3 3 1\n4 4 4 4 4 4 4 4 4 4 4 6 6 6 4 4 4 4 1 1 1 1\n\nTest Input 1:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 6 6 1 1 1 1 3 3 3 3 3 3 3 3 6 6 3 3\n3 3 8 6 1 3 3 8 8 8 3 3 3 9 9 9 6 8 3 3\n3 3 6 6 1 1 1 1 7 8 3 3 3 9 3 3 6 6 3 3\n3 3 3 3 3 3 3 8 8 8 3 3 3 9 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 1 7 1 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 4 4 4 3 3 3 3 3 1 7 8 3 3 3 3 3 3 3 3\n3 3 4 3 3 3 3 3 3 8 8 8 3 3 3 3 3 3 3 3\n3 3 
4 3 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 1 1 1 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 1 6 1 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 2 2 2 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 1 1 1 3 3\n3 3 3 3 2 3 2 3 3 1 6 1 3 3 3 1 7 1 3 3\n3 3 3 3 4 4 4 3 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 4 4 1 4 4 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 3 4 4 4 3 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 2 3 2 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTest Input 2:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 2 4 2 1 1 1 1 3 2 2 1 1 1\n1 1 1 1 1 1 1 2 2 2 1 1 1 1 1 2 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 2 2 1 1 1\n1 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 2 4 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 2 2 2 1 1 1 1 1 4 4 4 1 6 1 6 1 8 8 8\n1 1 3 1 1 1 1 1 1 4 7 4 8 8 8 8 8 8 7 8\n9 9 3 9 9 1 1 1 1 4 4 4 8 1 1 1 8 8 8 8\n1 9 9 9 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 6 1 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 8 8 8 3 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 8 7 8 3 3 1 1 1 1 1 1\n1 1 1 6 4 4 4 1 1 8 8 8 3 3 3 1 1 1 1 1\n1 6 6 6 4 7 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 6 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 3, + 3 + ], + [ + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 9, + 9, + 9, + 6, + 8, + 6, + 1, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 4, + 3, + 3, + 3, + 3, + 3, + 9, + 3, + 3, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 7, + 8 + ], + [ + 3, + 4, + 3, + 3, + 3, + 3, + 3, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 1, + 1, + 1, 
+ 3, + 3, + 3, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 1, + 6, + 1, + 3, + 3, + 3, + 1, + 7, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2, + 2, + 2 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 2, + 3, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 4, + 4, + 1, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 4, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 3, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 6, + 4, + 4, + 4, + 1, + 6, + 1, + 6, + 1, + 8, + 8, + 8, + 3, + 3, + 3, + 2, + 2 + ], + [ + 6, + 6, + 6, + 4, + 7, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 3, + 1, + 2, + 1 + ], + [ + 1, + 1, + 6, + 4, + 4, + 4, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 2, + 2 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + 
"source": "ARC2-Eval" + }, + { + "problem_id": "arc2_21897d95", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n6 6 6 6 6 7 7 7 4 4 4 4\n6 6 6 6 6 7 7 7 4 4 4 4\n6 6 6 1 6 7 7 7 4 4 4 4\n6 6 6 3 1 7 7 7 4 9 9 9\n6 6 6 1 6 7 7 7 4 4 4 9\n6 6 6 6 6 7 7 7 4 4 4 9\n6 6 6 6 6 7 1 7 4 4 4 4\n6 6 6 6 6 7 1 1 4 4 4 4\n6 6 6 6 6 7 1 7 4 4 4 4\n6 6 6 6 6 7 7 7 4 4 4 4\n7 7 1 7 7 7 7 7 7 7 7 7\n7 1 0 1 7 7 7 7 7 1 1 1\n7 7 7 7 7 7 7 7 7 7 1 7\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n\nTraining Example 2:\nInput:\n7 7 7 7 7 7 1 7 3 3\n7 7 7 7 7 7 1 1 3 3\n7 7 7 7 7 7 1 7 3 3\n8 8 8 3 1 7 7 7 3 1\n8 8 8 1 1 7 7 7 1 6\n8 1 8 3 1 7 7 7 3 1\n8 1 1 3 3 1 9 1 3 3\n8 1 8 3 3 7 1 7 3 3\n8 8 8 3 3 5 5 5 3 3\n8 8 8 3 3 5 5 5 3 3\n\nOutput:\n6 6 6 6 6 6 6 6 7 7\n6 6 6 6 6 6 6 6 7 7\n6 6 6 6 6 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 9 9 9 7 7\n3 3 3 8 8 9 9 9 7 7\n\nTraining Example 3:\nInput:\n6 6 6 3 1 3 3 3 3\n6 6 6 1 1 3 3 3 3\n6 6 6 3 1 3 3 3 3\n6 6 6 4 4 4 4 1 4\n6 6 6 4 4 4 1 1 1\n6 6 6 4 4 4 4 4 4\n6 6 6 6 1 6 4 4 4\n6 6 6 6 1 1 4 4 4\n6 6 6 6 1 6 4 4 4\n5 5 5 4 4 4 4 4 4\n9 9 9 8 8 8 8 8 8\n9 5 5 8 8 8 1 7 1\n9 5 5 8 8 8 8 1 8\n5 5 5 4 4 4 4 4 4\n\nOutput:\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 6 6 6 6 6 6 4 4 4\n7 8 8 8 6 6 6 6 6 6 6 4 4 4\n7 8 8 8 
6 6 6 6 6 6 6 4 4 4\n\nTraining Example 4:\nInput:\n2 2 2 2 2 1 2 3 3 3\n2 2 2 2 2 1 1 3 3 3\n2 2 2 2 2 1 2 3 3 3\n6 6 6 6 1 6 6 3 1 3\n6 6 6 1 1 1 6 1 1 3\n1 1 1 6 6 6 6 3 1 3\n6 1 6 6 6 6 6 3 3 3\n4 4 4 4 4 4 4 3 3 3\n4 4 4 4 4 4 4 3 3 3\n4 4 4 4 4 4 4 3 3 3\n\nOutput:\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n\nTest Input 1:\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 7 7 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 3 3 3 1 3 3 3 3 3 3 9 9 9 7 7 7 7 9 9\n9 9 9 9 3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 3 3 9 9 9 7 7 7 7 9 9\n9 9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 7 7 7 7 9 9\n9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 9 1 9 9 9 9\n9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 1 1 1 9 9 4\n9 3 3 3 3 0 1 0 0 0 0 0 0 0 0 0 3 3 3 3 3 3 9 9 9 9 9 9 4 4\n9 3 3 3 0 1 8 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 9 9 9 9 9 4 4 4\n9 3 3 0 0 0 0 0 0 0 0 0 0 2 1 2 2 0 0 0 0 0 9 9 9 9 9 4 4 4\n9 3 3 0 0 0 0 0 0 0 2 2 2 1 1 1 2 2 2 2 0 0 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 0 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 6 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 6 0 0 1 1 1 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 0 1 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 0 0 2 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 6 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 1 2 2 2 2 2 2 2 2 2 9 9 9 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 6 9 2 2 2 2 2 2 2 2 9 9 9 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 9 2 2 2 2 2 2 2 9 9 9 8 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 6 9 9 9 2 2 
2 2 9 9 9 9 8 8 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 9 9 9 9 9 9 9 9 9 9 9 8 8 8 8 8 8 1 8\n6 6 6 6 6 9 9 9 9 9 9 9 9 9 9 9 8 8 8 8 8 8 8 8 8 8 8 1 1 1\n9 9 9 9 9 9 9 9 9 9 9 9 1 9 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n9 9 9 9 9 9 9 9 9 9 9 9 0 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n9 9 9 9 9 9 9 9 9 9 9 9 1 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 2:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 1 1 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 1 5 5\n3 3 1 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 1 1 1 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 9 9 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 1 7 1 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 1 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 4 1 4 4 4 4 4 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 1 1 1 4 4 4 4 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 6 6 1 1 1 6\n3 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 6 6 6 1 6 6\n2 2 1 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 1 1 1 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3 + ], 
+ [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 3, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8 + ], + [ + 3, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 2, + 2, + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 2, + 2, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 2, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, 
+ 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 0, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, 
+ 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 
4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_abc82100", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n1 2 8 8 8\n0 0 0 0 1\n0 0 0 1 0\n0 0 0 1 0\n0 0 0 0 1\n\nOutput:\n0 0 0 0 0\n0 0 0 0 2\n0 0 0 2 2\n0 0 0 2 2\n0 0 0 0 2\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 6 0 6 0 6 0 6 0 6 0 6 0 6 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n0 2 0 8 0 8 0 0 0 0 0 0 0 4 0\n0 0 0 0 7 0 0 0 0 0 0 0 0 0 0\n0 8 0 0 6 0 0 8 0 0 0 0 0 0 0\n8 0 4 2 0 4 2 0 8 0 0 0 0 0 0\n0 8 0 0 7 0 0 8 0 0 0 0 0 2 0\n0 0 0 0 6 0 0 0 0 0 0 0 0 0 0\n0 7 0 8 0 8 0 7 0 7 0 7 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 7 0 7 0 7 0 7 0 7 0 7 0 7 0\n7 0 7 0 7 0 7 0 7 0 7 0 7 0 7\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 0 0 0 0 0 0 0 0 4 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0\n6 0 6 0 0 0 6 0 6 0 6 0 6 0 0\n0 6 0 0 0 0 0 6 0 6 0 6 0 0 0\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 4 0 0 0 0 0 0 0 0 0 0 0 4 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 0 0 0 0 8 0 0 0 4 0 0 0 4 0 0\n0 0 0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0\n0 0 0 4 0 0 0 8 0 0 0 8 0 0 0 4 0 0 0 0\n0 0 0 0 0 0 8 0 0 0 0 0 8 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 8 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 7 0 0 0 0 0\n1 0 0 0 1 0 0 0 0 0 0 0 8 0 0 0 8 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 8 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 0 8 0 0 0\n\nOutput:\n0 2 0 2 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0 2\n0 0 2 0 2 0 0 0 0 0 2 0 0 0 2 0 2 0 0 0\n0 2 0 2 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0 2\n2 0 2 0 0 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0\n0 2 0 0 0 2 0 0 0 0 0 0 0 2 0 0 0 2 0 0\n0 0 2 0 2 0 0 0 0 0 0 0 0 0 2 0 2 0 0 0\n0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 
0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 4:\nInput:\n1 1 1 1 1 2 0 0\n0 0 0 0 0 2 0 0\n0 0 0 0 0 2 0 0\n0 2 1 8 0 2 0 0\n0 0 0 0 0 2 0 0\n0 0 8 0 0 2 0 0\n0 0 2 0 0 2 0 0\n0 0 1 0 0 2 0 0\n\nOutput:\n2 2 2 2 2 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n\nTest Input:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0\n2 0 0 8 0 0 0 6 0 0 0 0 0 0 0 0 0 0 0 6\n0 4 1 8 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0\n0 0 0 8 0 0 0 0 0 0 0 0 0 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 4 0 0\n0 2 4 8 0 8 0 0 0 0 0 2 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0\n0 5 7 8 8 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 2 0 0 0 0 0 0 0 2 0 0 0 0 0 6\n0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0 0 6 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n5 0 0 0 0 0 0 0 0 6 0 0 0 0 0 0 0 0 0 0\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 0, + 0 + ], + [ + 4, + 0, + 4, + 0, + 0, + 0, + 0, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6 + ], + [ + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 7, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 4, + 0, + 0 + ], + [ + 0, + 4, + 0, + 4, + 0, + 4, + 0, + 4, + 0, + 1, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 6 + ], + [ + 0, + 0, + 4, + 7, + 0, + 0, + 4, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 6, 
+ 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "num_test_pairs": 1, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_9bbf930d", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n6 7 1 1 1 1 1 1 1 1 1 1 1 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 1 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 4 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 9\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 9 7 9\n6 7 7 8 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 3 3 7 7\n\nOutput:\n6 7 1 1 1 1 1 1 1 1 1 1 1 7 6 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 1 1 1 1 1 1 1 1 1 1 1 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 4 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 7 4\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 9\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 9 7 9\n6 7 7 8 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 3 3 6 7\n\nTraining Example 2:\nInput:\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 5 5 5 5 5 5 5 5 5 5 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 
7 7 7 7 7 7\n6 7 9 9 9 9 9 9 9 9 9 9 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n\nOutput:\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 5 5 5 5 5 5 5 5 5 5 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 9 9 9 9 9 9 9 9 9 9 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n\nTraining Example 3:\nInput:\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 4 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 7 4 7 4 4 4 7 4\n6 7 7 7 7 7 7 4 7 4 7 4 7 4 7 4\n6 7 2 2 2 2 2 2 7 7 7 7 7 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 2 2 2 2 2 2 7 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 5 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 5 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 3 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 3\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 7 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 3 7 3\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n\nOutput:\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n7 7 7 7 7 7 7 7 7 4 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 7 4 7 4 4 4 7 4\n6 7 7 7 7 7 7 4 7 4 7 4 7 4 7 4\n6 7 2 2 2 2 2 2 7 7 7 7 7 4 7 4\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 2 2 2 2 2 2 7 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 6 5 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 7 5 7 9 7 0\n7 7 7 7 7 7 7 7 7 7 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 5 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 6 7\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 3 3\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 3\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 7 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 3 7 3\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 6 7\n\nTest Input:\n6 7 9 9 9 9 9 9 9 7 7 7 7 7 7 7 9 9 9 9 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 9\n6 7 9 9 9 9 9 
9 9 7 7 7 7 0 7 0 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 0 7 0 7 7 9 7 9\n6 7 0 0 0 0 0 0 0 7 7 7 0 0 7 0 7 7 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 0 7 7 9 7 9\n6 7 0 0 0 0 0 0 0 7 7 7 0 0 0 0 7 7 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 0 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 7 7 7 0 7 0 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 8 8 8 8 8 7 1 7 1 7 0 7 0 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 1 7 0 7 0 0 0 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 7 0 7 7 7 7 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 0 0 0 0 0 7 7 7 7\n6 7 4 4 4 4 4 4 4 4 7 7 7 4 4 4 4 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4 7 7 7 7\n6 7 4 4 4 4 4 4 4 4 2 7 2 4 4 7 4 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 2 7 2 7 4 7 4 7 9 7 9\n6 7 2 2 2 2 2 2 2 2 2 7 2 7 4 7 4 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 2 7 7 7 7 7 7 7 9\n6 7 2 2 2 2 2 2 2 2 2 2 2 7 7 7 7 9 9 9 9\n\nGive your answer in ... tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 6, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 7, + 6, + 7, + 7, + 6, + 7, + 9, + 9, + 9, + 9, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 9 + ], + [ + 6, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 7, + 7, + 7, + 7, + 0, + 7, + 0, + 9, + 9, + 9, + 7, + 9 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 7, + 0, + 8, + 8, + 8, + 8, + 7, + 
7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 8, + 8, + 8, + 8, + 8, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 8, + 8, + 8, + 8, + 7, + 7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 0, + 7, + 0, + 0, + 0, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 6 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 4, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 7, + 2, + 4, + 4, + 7, + 4, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 7, + 2, + 7, + 4, + 7, + 4, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 7, + 2, + 7, + 4, + 7, + 4, + 9, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 9 + ], + [ + 6, + 7, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 7, + 7, + 6, + 7, + 9, + 9, + 9, + 9 + ] + ] + ], + "num_test_pairs": 1, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_a32d8b75", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 6 5 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n0 7 7 7 0 6 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n0 7 7 4 0 6 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 
3 3\n0 7 4 7 0 6 5 5 5 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 3 3 3 3\n0 0 0 0 0 6 5 5 5 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n0 0 0 0 0 6 5 5 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n1 1 1 0 0 6 5 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 1 0 0 6 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 1 0 0 6 5 3 3 3 3 8 8 8 8 8 8 8 1 1 1 8 8 8 8 8 8 8 8 3\n0 1 1 1 0 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 8 8 8 8 8 8 8 8 3\n1 1 1 1 1 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 8 8 8 8 8 8 8 8 3\n1 0 1 0 1 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 8 8 8 8 8 8 8 8 3\n6 6 6 6 6 6 5 3 3 3 8 8 8 8 8 8 8 8 1 1 8 8 8 8 8 8 8 8 8 3\n6 0 0 0 6 6 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n6 0 0 0 6 6 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n6 0 0 4 6 6 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3\n6 6 6 6 6 6 5 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n6 0 0 0 6 6 5 5 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 5\n6 0 7 0 6 6 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n6 0 7 0 6 6 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5 5\n\nOutput:\n5 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n5 5 5 3 3 3 3 3 3 4 4 4 3 3 3 4 4 4 3 3 3 4 4 4\n5 5 5 3 3 3 3 3 3 4 4 7 8 8 8 4 4 7 8 8 3 4 4 7\n5 5 5 3 3 3 3 3 3 4 7 4 8 8 8 4 7 4 8 8 8 4 7 4\n5 5 3 3 3 3 3 8 8 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n5 5 3 3 3 3 8 8 8 4 4 7 4 4 7 4 4 7 4 4 7 4 4 7\n5 5 3 3 3 8 8 8 8 4 7 4 4 7 4 4 7 4 4 7 4 4 7 4\n5 3 3 3 3 8 8 8 8 8 8 8 4 4 4 4 4 4 4 4 4 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 4 4 7 4 4 7 4 4 7 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 4 7 4 4 7 4 4 7 4 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 4 4 4 8 8 8 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 8 1 1 8 4 4 7 8 8 8 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 4 7 4 8 8 8 8 3 3\n5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 4 4 4 8 8 8 8 3 3\n5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 4 4 7 8 8 8 3 3 3\n5 5 5 3 3 3 8 8 8 8 8 8 8 8 8 4 7 4 8 8 3 3 3 3\n5 5 5 3 3 3 3 8 8 8 8 8 8 8 8 4 4 4 4 4 4 4 4 4\n5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 4 4 7 4 4 7 4 4 7\n5 5 5 5 3 3 3 3 
3 3 3 3 3 3 3 4 7 4 4 7 4 4 7 4\n\nTraining Example 2:\nInput:\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 1 1 2 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 1 1 1 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 2 1 2 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 6 6 6 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 4 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 6 6 6 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 7 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 7 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n\nOutput:\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 
9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n\nTraining Example 3:\nInput:\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 3 3 3 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 8 3 8 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 8 3 3 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 2 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 6 6 6 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 4 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 0 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 7 7 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nOutput:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 8 8 8 8 8 8 8 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 3 3 8 3 3 8 3\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 8 3 8 8 3 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 8 8 8 5 5 5 8 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 3 5 5 5 3 8 3\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 8 8 4 4 4 3 8 8\n4 4 4 4 4 4 4 4 4 8 8 8 8 8 8 8 8 8 4 4 4 8 8 8\n4 4 4 4 4 4 4 4 4 3 8 3 3 8 3 3 8 3 4 4 4 3 8 3\n4 4 4 4 4 4 4 4 4 3 8 8 3 8 8 3 8 8 4 4 4 3 8 8\n4 4 4 4 4 4 4 4 4 4 
4 4 4 4 4 4 4 4 4 4 4 4 4 4\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 1:\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 1 1 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 1 3 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 2 4 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 4 2 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 3 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 3 3\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 3\n0 7 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 3 3 3\n7 7 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 0 3 0\n7 0 0 7 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 3 3 3\n7 7 7 7 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 7 0 0 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 7 7 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 0 0 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 7 7 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n6 6 6 6 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 6 6 6 6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 4 0 0 
6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 0 0 4 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 6 6 6 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 6 6 6 6\n6 0 7 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 0 7 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 7 0 6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 7 0 6\n\nTest Input 2:\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 3 3 3 3 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 3 3 3 3 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 4 4 4 4 4 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 4 4 0 0 4 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 4 0 0 0 4 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 4 4 4 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 6 6 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 4 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 6 6 6 6 6 6 1 1 1 1 1 1 
1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 7 7 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 4, + 2, + 9, + 9, + 4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 2, + 4, + 9, + 9, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 4, + 2, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 4, + 2, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0 + ], + 
[ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 1, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 3, + 1, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 9, + 9, + 9, + 9, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 3, + 1, + 3, + 1, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 3, + 1, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 3, + 1, + 3, + 1 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, 
+ 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 2, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2, + 2, + 2, + 2, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 2, + 2, + 2, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 3, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 
3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 3, + 2, + 2, + 2, + 2, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 2, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_e12f9a14", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 3 3 8 8 8 8 8 8 3 3 8 8 8 3 8 3 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 8 3 
3 8 8 8 8 8 8 3 3 8 8 8 3 8 3 3 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 6 6 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 8 1 4 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n9 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 9 8 8 8 8 8 8 9 1 8 8 8 8 8 8 1 8 4 8 8 8 8 8\n8 8 9 8 8 8 8 9 8 8 1 8 8 8 8 1 8 8 4 8 8 8 8 8\n8 8 8 9 3 3 9 8 8 8 8 1 3 3 1 8 8 3 4 3 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 9 3 3 9 8 8 8 8 1 3 3 1 8 8 3 4 3 3 8 8 8\n8 8 9 8 8 8 8 9 8 8 1 8 8 8 8 1 8 8 4 8 8 8 8 8\n8 9 8 8 8 8 8 8 9 1 8 8 8 8 8 8 1 8 4 8 8 8 8 8\n9 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 3 3 3 3 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 3 6 6 6 6 6 6 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 3 6 6 3 8 8 8 6 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8\n8 3 3 3 3 8 8 8 8 6 8 9 1 8 8 8 8 8 8 8 1 4 8 8\n8 8 8 8 8 8 8 8 8 8 6 8 9 1 8 8 8 8 8 8 8 1 4 8\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n8 3 3 8 3 8 8 8\n8 3 4 4 3 8 8 8\n8 3 4 4 8 8 8 8\n8 8 3 3 3 8 8 8\n8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 4 8 8 8 8\n8 8 8 4 8 8 8 8\n8 3 3 4 3 8 8 8\n8 3 4 
4 3 8 8 8\n8 3 4 4 4 4 4 4\n8 4 3 3 3 8 8 8\n4 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n\nTraining Example 3:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 2 2 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 8 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 2 8 4 8 8 8 8\n8 8 8 3 2 2 2 2 2 2 2 2 2 8 4 8 8 8 8 8\n2 2 2 2 2 2 3 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 4 3 8 8 8 8 8\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n7 7 7 7 7 7 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 4:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 3 8 3 8 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 8 3 3 3 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 
8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 6 8 8 8 6 8 8 8 8 8\n8 8 6 8 8 6 8 8 8 8 8 8\n8 3 6 3 6 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 6 3 3 3 8 8 8 8 8 8 8\n6 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 1:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 2 2 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 2 2 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 8 0 0 0 0 0\n0 0 0 0 0 8 8 0 0 0 0 8 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 3 3 8 0 0 8 4 4 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 3 3 8 0 0 8 4 4 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 8 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 7 7 8 
0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 7 7 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 8 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 8 3 3 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 2 2 3 8 8 8 8 8 8 8 3 4 4 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 2 3 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 3 8 3 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 6 6 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 6 6 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 7 7 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 7 7 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 3 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 9 9 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 9 9 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 2, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 0 + ], + [ + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 2, + 8, + 8, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 8, + 2, + 2, + 8, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 2, + 2, + 8, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 3, + 8, + 8, + 3, + 0, + 0, + 4, + 8, + 8, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 0 + ], + 
[ + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 3, + 8, + 3, + 0, + 0, + 4, + 8, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 
0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 7, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 7, + 8, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 8, + 8, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6 + ], + [ + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8 + ], + [ + 2, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8 + ], + [ + 8, + 2, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8, + 8 + ], + [ + 9, + 8, + 2, + 3, + 2, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 9, + 8, + 2, + 2, + 2, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 8, + 6, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 2, + 2, + 3, + 8, 
+ 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 4, + 3, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 6 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 6, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 6, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 3, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 6, + 3, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 6, + 3, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 
8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 6, + 6 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 3, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 3, + 7, + 7, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 3, + 3, + 3, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8 + ], + [ + 3, + 3, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 8 + ], + [ + 3, + 9, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8 + ], + [ + 3, + 9, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8 + ], + [ + 3, + 3, + 3, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_13e47133", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 1 1 1 1 1 1 1 
2 1 1 1 1 1 1 1 1 1 1 8\n1 8 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 4 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 3 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n7 7 7 7 7 7 7 7 2 8 8 8 8 8 8 8 8 8 8 8\n7 8 8 8 8 8 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 7 7 7 7 8 7 2 8 4 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 4 4 4 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 8 8 8 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 4 4 4 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 7 8 8 7 8 7 2 8 8 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 2 2 2 2 2 2 2 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 2 2 2 2 2 2 2 2 8 4 8\n7 8 7 8 8 7 8 7 2 8 8 8 8 8 8 8 8 8 4 8\n7 8 7 7 7 7 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 8 8 8 8 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 7 7 7 7 7 7 7 2 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n4 4 4 4 4 4 4 4 4 4 2 8 4 4 4 4 4 4 4 4\n4 3 4 4 4 4 4 4 4 4 2 4 1 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 
4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 2 2 2 2 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 2 5 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 0 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 1 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n\nOutput:\n4 4 4 4 4 4 4 4 4 4 2 8 8 8 8 8 8 8 8 8\n4 3 3 3 3 3 3 3 3 4 2 8 1 1 1 1 1 1 1 8\n4 3 4 4 4 4 4 4 3 4 2 8 1 8 8 8 8 8 1 8\n4 3 4 3 3 3 3 4 3 4 2 8 1 8 1 1 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 1 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 8 8 8 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 1 1 1 1 1 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 8 8 8 8 8 8 8 8\n4 3 4 3 4 4 3 4 3 4 2 2 2 2 2 2 2 2 2 2\n4 3 4 3 4 4 3 4 3 4 2 5 5 5 5 5 5 5 5 5\n4 3 4 3 4 4 3 4 3 4 2 5 0 0 0 0 0 0 0 5\n4 3 4 3 4 4 3 4 3 4 2 5 0 1 1 1 1 1 0 5\n4 3 4 3 3 3 3 4 3 4 2 5 0 1 5 5 5 1 0 5\n4 3 4 4 4 4 4 4 3 4 2 5 0 1 1 1 1 1 0 5\n4 3 3 3 3 3 3 3 3 4 2 5 0 0 0 0 0 0 0 5\n4 4 4 4 4 4 4 4 4 4 2 5 5 5 5 5 5 5 5 5\n\nTraining Example 3:\nInput:\n9 8 8 8 8 8 6 8 8 8 8 8 7\n8 1 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 6 6 6 6 6 6\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n\nOutput:\n9 9 9 9 9 9 6 7 7 7 7 7 7\n9 1 1 1 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 6 6 6 6 6 6\n9 1 9 9 1 9 6 8 8 8 8 8 8\n9 1 1 1 1 9 6 8 8 8 8 8 8\n9 9 9 9 9 9 6 8 8 8 8 8 8\n\nTest Input 1:\n1 3 3 3 3 3 3 3 3 3 3 8 6 3 3 3 3 3 3 3 8 2 3 3 3 3 3 3 3 3\n3 2 3 3 3 3 3 3 3 3 3 
8 3 4 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 5 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 4 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 1 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 4 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n\nTest Input 2:\n8 8 8 8 8 8 4 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 4 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n8 8 8 8 8 8 6 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 5 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 4 8 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 7 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 2 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 1 1 1 1 1 1 1 1 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 4 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 1 1 1 1 1 1 1 1\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 8, + 6, + 4, + 4, + 4, + 
4, + 4, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 2, + 2, + 2, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 1, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 4, + 4, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 6, + 6, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 4, + 4, + 4, + 4, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 1, + 1, + 4, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 4, + 1, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 4, + 1, + 4, + 8, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 1, + 1, + 4, + 8, + 6, + 4, + 4, + 4, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 4, + 4, + 4, + 4, + 8, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 
2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 1, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 2, + 2, + 2, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 8, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 6, + 4, + 5, + 6, + 6, + 6, 
+ 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 2, + 2, + 2, + 1, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 8, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 1, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2 + ], + [ + 4, + 3, + 4, + 4, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 3, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 3, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 4, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2 + ], + [ + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 1, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 2, + 2, + 2, + 2, + 2, + 
2, + 2, + 2, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 6, + 1, + 2, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4 + ], + [ + 6, + 5, + 4, + 4, + 4, + 5, + 6, + 1, + 2, + 7, + 2, + 2, + 2, + 2, + 7, + 2, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 7, + 2, + 2, + 2, + 2, + 7, + 2, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4 + ], + [ + 6, + 5, + 
4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4, + 1, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 9 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4, + 1, + 9, + 2, + 9, + 9, + 9, + 9, + 2, + 9 + ], + [ + 6, + 5, + 4, + 4, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4, + 1, + 9, + 2, + 9, + 9, + 9, + 9, + 2, + 9 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 6, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 1, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 9 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_88e364bc", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 7 7 7 7 7 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 7 7 0 0 0 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 7 7 0 4 0 0 7 0 0 0 0 0 0 0\n0 7 7 7 7 7 7 0 0 0 7 7 7 0 0 5 5 5 5 0\n0 7 0 0 0 0 0 0 0 7 7 0 0 5 5 5 0 0 5 0\n0 7 0 0 0 0 0 0 0 7 5 5 5 5 0 0 0 0 5 0\n0 7 7 0 4 0 0 0 0 7 5 0 0 0 0 0 0 5 5 0\n0 0 7 7 7 7 0 0 0 7 5 0 0 0 0 0 0 5 0 0\n0 0 0 0 0 7 7 7 7 7 5 0 0 
0 0 4 0 5 0 0\n0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 5 0 0\n0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 5 0 0 4 0 5 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 0 0 0 0 5 0 0 0 0 0 0 4 0 0 0 0 5 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 0 5 0 5 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n\nOutput:\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 7 7 7 7 7 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 7 7 0 0 0 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 7 7 0 0 0 4 7 0 0 0 0 0 0 0\n0 7 7 7 7 7 7 0 0 0 7 7 7 0 0 5 5 5 5 0\n0 7 0 0 0 0 0 0 0 7 7 0 0 5 5 5 0 0 5 0\n0 7 0 0 0 0 0 0 0 7 5 5 5 5 0 0 0 0 5 0\n0 7 7 0 0 0 0 0 4 7 5 0 0 0 0 0 0 5 5 0\n0 0 7 7 7 7 0 0 0 7 5 0 0 0 0 0 0 5 0 0\n0 0 0 0 0 7 7 7 7 7 5 4 0 0 0 0 0 5 0 0\n0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 5 0 0\n0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 5 4 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 0 0 0 0 5 4 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 0 5 0 5 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 1 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 5 1 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 1 5 5 2 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 2 5 5 5\n0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0\n0 0 5 4 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 5 0 0 4 0 0 5 5 0 0 0 0\n0 5 5 0 5 5 5 0 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 0 0 0 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 
0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 1 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 5 1 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 1 5 5 2 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 2 5 5 5\n0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 4 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 5 0 0 0 0 0 5 5 0 0 0 0\n0 5 5 0 5 5 5 0 5 0 0 0 4 5 5 0 0 0 0 0\n0 0 5 5 5 0 0 0 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 2 5 2 5\n0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 4 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 0 0 5 0 0 0 0 0 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 0 0 5 5 5 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 5 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 5 5 0 0 4 0 0 0 4 0 0 0 0 0 5 0 0 0\n0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 0 5 0 0 0\n0 0 0 0 5 0 0 5 5 0 0 0 5 5 5 5 5 0 0 0\n0 0 0 0 5 0 0 5 5 5 0 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 5 5 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 2 5 2 5\n0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 0 0 5 0 0 0 0 
0 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n0 0 5 0 0 4 0 0 0 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 0 0 5 5 5 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 5 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 0 5 0 0 0\n0 0 0 0 5 0 0 5 5 0 0 0 5 5 5 5 5 0 0 0\n0 0 0 0 5 0 0 5 5 5 4 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 5 5 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 4 5 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n5 5 5 1 5 5 5 0 0 5 5 5 0 0 0 0 0 0 0 0\n5 1 5 5 1 5 5 0 0 5 0 5 5 5 0 0 0 0 0 0\n5 5 1 5 5 2 5 0 0 5 0 4 0 5 0 0 5 5 0 0\n5 5 5 2 5 5 5 0 0 5 0 0 0 5 5 5 5 5 5 0\n5 5 5 5 5 5 5 0 0 5 0 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 0 5 0 4 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 1 1 1 1 1 5 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 1 0 0 0 1 5 5 5 0 0 5 5 5 5 0\n0 0 0 0 0 1 0 0 0 1 1 1 5 5 5 5 0 0 0 0\n0 0 0 0 0 1 1 0 0 0 0 1 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 1 1 0 4 0 1 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 1 0 0 0 0 1 0 0 1 1 0 0\n0 0 0 0 0 0 0 0 1 1 0 0 0 1 0 0 0 1 1 0\n1 1 1 1 1 0 0 0 0 1 1 1 1 1 0 0 0 0 1 0\n1 2 1 2 1 0 0 0 0 1 0 0 0 0 0 0 0 0 1 0\n1 5 1 5 1 0 0 0 0 1 0 0 0 0 0 0 4 0 1 0\n1 5 1 5 1 0 0 0 0 1 1 4 1 1 1 1 1 1 1 0\n1 1 1 1 1 0 0 0 0 0 1 1 1 0 0 0 0 0 0 0\n\nTest Input 2:\n6 6 6 6 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n6 2 6 2 6 0 0 3 3 3 3 3 3 3 0 0 6 6 6 6\n6 1 6 1 6 0 0 3 0 0 0 0 0 3 0 0 6 0 0 6\n6 1 6 1 6 0 3 3 0 0 0 0 0 3 6 6 6 6 0 6\n6 6 6 6 6 0 3 0 0 0 0 0 3 3 6 0 0 0 0 6\n0 0 0 0 0 0 3 0 0 0 0 0 3 0 6 0 4 0 0 6\n0 0 3 3 3 3 3 0 0 0 0 0 3 3 6 6 6 0 0 6\n0 0 3 0 0 0 0 0 0 4 0 0 0 3 3 0 6 0 0 6\n0 0 3 3 0 0 0 0 0 0 0 4 0 3 3 0 6 0 4 6\n0 0 0 3 3 3 3 3 3 3 3 3 3 3 0 0 6 6 0 6\n0 0 0 0 3 3 3 3 3 3 3 0 0 0 0 0 0 6 6 6\n0 0 0 0 3 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 0 4 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 0 0 0 0 0 3 0 0 3 3 3 3 3 3 3\n0 0 3 0 0 0 0 0 0 3 3 0 0 3 3 3 
2 3 3 3\n0 0 3 0 0 0 0 0 0 3 0 0 0 3 2 3 3 1 3 3\n0 0 3 3 0 4 0 0 0 3 0 0 0 3 3 1 3 3 1 3\n0 0 0 3 3 3 0 0 3 3 0 0 0 3 3 3 1 3 3 3\n0 0 0 0 0 3 3 3 3 0 0 0 0 3 3 3 3 3 3 3\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 0, + 0, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 1, + 5, + 5, + 1, + 5, + 5, + 0, + 0, + 5, + 0, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 5, + 1, + 5, + 5, + 2, + 5, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 5, + 0, + 0 + ], + [ + 5, + 5, + 5, + 2, + 5, + 5, + 5, + 0, + 0, + 5, + 0, + 0, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 0 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 5, + 5, + 5, + 0, + 4, + 5, + 5, + 5, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 1, + 1, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 4, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 1, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 1, + 0, + 0, + 4, + 1, + 1, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 
0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 2, + 1, + 2, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 5, + 1, + 5, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 5, + 1, + 5, + 1, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 6, + 6, + 6, + 6, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 6, + 2, + 6, + 2, + 6, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 6, + 6, + 6, + 6 + ], + [ + 6, + 1, + 6, + 1, + 6, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 6, + 0, + 4, + 6 + ], + [ + 6, + 1, + 6, + 1, + 6, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 0, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 3, + 6, + 0, + 4, + 0, + 0, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 0, + 6, + 0, + 0, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 6, + 6, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 6, + 6, + 0, + 6 + ], + [ + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], + [ + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, 
+ 0, + 0 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 3, + 3, + 3, + 2, + 3, + 3, + 3 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 3, + 2, + 3, + 3, + 1, + 3, + 3 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 3, + 3, + 1, + 3 + ], + [ + 0, + 0, + 0, + 3, + 3, + 3, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 3, + 1, + 3, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_e3721c99", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 0 3 0 1 0 1 0 1 0 2 0 2 0 2 0 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 0 5 5 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 5 5 0 0 0 0 0 5 5 0 0 0 5 5 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 5 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 
5 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0 0\n0 0 0 5 5 5 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 5 5 5 0 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 0 5 0 5 0 0 0 0 5 5 5 5 0 0 5 0 0\n0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 5 5 5 0 0 0 5 5 0 5 5 5 5 0 0\n0 0 0 0 0 5 5 5 0 5 0 0 5 0 5 5 5 0 0 0 0 5 5 0 0 5 5 5 0 0\n0 0 0 5 5 5 5 5 0 5 0 0 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0\n0 0 5 5 5 5 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 0 5 5 5 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 0 3 0 1 0 1 0 1 0 2 0 2 0 2 0 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 3 3 0 4 4 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 3 3 0 4 4 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 4 4 0 0 0 0 0 1 1 0 0 0 1 1 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 1 1 0 0 0 1 1 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 4 4 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0 0\n0 0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1 1 1 0 0\n0 0 0 3 3 3 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 
0 1 1 1 0 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 0 2 0 2 0 0 0 0 1 1 1 1 0 0 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 2 0 0 0 1 1 0 1 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 0 2 2 2 0 0 0 0 1 1 0 0 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 0 3 0 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 5 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 5 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 5 5 5 0 0 5 5 5 0 0\n0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 5 0 0 0 5 5 5 5 0 0 0 0 5 5 5 5 5 5 5 5 0 0\n0 5 5 5 5 5 5 5 5 0 0 0 5 5 5 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0\n0 0 5 5 5 5 5 5 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 5 5 0 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 5 0 0 5 5 0 0 0 0 0\n0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 
0\n0 0 0 0 5 0 0 5 5 0 0 0 5 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 0 0 5 5 0 0 5 0 0 0 5 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 0 0 0\n0 0 0 5 5 0 5 5 0 0 0 5 0 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 5 5 5 0 0 0 5 0 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 5 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 0 3 0 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 3 0 0\n0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 0 0 3 3 3 3 3 3 3 3 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 3 3 3 0 0 3 3 3 0 0\n0 0 0 0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 3 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 3 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 2 0 0 0 2 2 2 2 0 0 0 0 3 3 3 3 3 3 3 3 0 0\n0 2 2 2 2 2 2 2 2 0 0 0 2 2 2 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0\n0 0 2 2 2 2 2 2 0 0 0 0 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 2 2 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0 0 0 3 3 3 3 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 3 3 0 3 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 3 0 0 3 3 0 0 0 0 0\n0 0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 3 0 0 3 0 0 0 0 0 0\n0 0 0 0 3 0 0 3 3 0 0 0 0 0 0 0 0 0 0 0 3 3 3 3 3 0 0 0 0 0\n0 0 0 3 3 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 3 3 3 3 0 0 0 0 0 0\n0 0 0 3 3 0 3 3 0 0 0 0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 5 5 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 1 0 8 8 8 0\n0 5 5 5 5 5 5 5 0 5 5 5 0 0 5 5 5 5 5 0 0 0 0 0 1 0 8 0 8 0\n0 5 0 5 5 0 0 5 0 0 0 0 0 5 5 0 0 0 5 0 0 0 0 0 1 0 8 8 8 0\n0 5 0 0 5 0 0 5 0 0 0 0 0 5 0 0 0 0 5 0 5 5 5 0 1 0 8 0 8 0\n0 5 5 5 5 0 0 5 0 0 0 0 0 5 5 0 0 5 5 0 5 0 5 0 1 0 8 8 8 0\n0 0 5 5 5 0 5 5 0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 0 1 0 0 0 0 0\n0 0 0 0 5 5 5 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 1 0 6 6 6 0\n5 5 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 1 0 6 0 6 0\n5 5 0 0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 0 0 1 0 6 6 6 0\n5 5 5 0 0 0 0 0 0 0 5 5 0 0 5 5 5 0 0 5 5 5 5 0 1 0 6 0 6 0\n5 5 5 0 0 5 5 5 0 0 0 0 0 5 5 5 5 0 5 5 0 0 5 0 1 0 6 6 6 0\n5 5 5 0 5 5 0 5 5 5 5 0 0 5 0 0 5 5 5 0 0 0 5 0 1 0 6 0 6 0\n5 5 0 0 5 0 0 0 5 0 5 0 0 5 0 0 0 5 5 5 0 0 5 0 1 0 6 6 6 0\n0 0 0 0 5 5 0 0 5 5 5 0 0 5 5 0 0 5 0 5 5 5 5 0 1 0 6 0 6 0\n0 0 0 0 0 5 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 5 5 0 1 0 6 6 6 0\n0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0 5 0 0 1 0 0 0 0 0\n0 0 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 5 5 5 0 0 1 0 4 4 4 0\n0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 4 0 4 0\n5 5 5 5 5 5 5 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 1 0 4 4 4 0\n0 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 5 5 5 5 0 0 0 0 1 0 4 0 4 0\n0 0 0 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 5 5 5 5 0 0 1 0 4 4 4 0\n0 0 0 0 0 0 0 0 5 5 0 0 5 0 0 0 0 5 5 0 5 5 0 0 1 0 4 0 4 0\n0 5 5 0 0 0 0 5 5 0 0 0 5 0 0 0 5 5 0 0 5 0 0 0 1 0 4 4 4 0\n0 5 5 5 0 0 5 5 5 0 0 0 5 0 0 5 5 0 0 0 5 0 0 0 1 0 4 0 4 0\n0 5 5 5 0 5 5 0 5 5 5 5 5 5 5 5 0 0 0 0 5 0 0 0 1 0 4 4 4 0\n0 5 5 0 0 5 0 0 0 5 5 5 0 5 5 0 0 0 0 0 5 0 0 0 1 0 4 0 4 0\n0 0 0 0 0 5 0 0 0 0 5 0 0 0 5 0 0 0 0 5 5 0 0 0 1 0 4 4 4 0\n0 0 
0 0 0 5 5 0 0 0 5 0 0 0 5 0 0 0 5 5 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 1 0 0 0 0 0\n\nTest Input 2:\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 1 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 4 0 1 0 0 5 5 5 5 5 5 5 5 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 4 4 4 0 1 0 0 5 5 5 5 5 0 0 5 0 0 5 5 5 5 0 5 5 0 0 0 0 0\n0 0 0 0 0 1 0 0 5 5 5 5 5 5 5 5 0 0 5 5 5 5 5 5 5 5 0 0 0 0\n0 7 7 7 0 1 0 0 0 0 5 5 5 5 0 0 0 0 5 0 5 5 5 5 5 5 5 0 0 0\n0 7 0 7 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 7 7 7 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0\n0 7 0 7 0 1 0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 5 5 5 0 0 0 0 0 0\n0 7 7 7 0 1 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 5 5 0 0 0 5 5 5 5\n0 0 0 0 0 1 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 2 2 2 0 1 0 0 0 0 5 5 5 0 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0\n0 2 0 2 0 1 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0\n0 2 2 2 0 1 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 0 0\n0 2 0 2 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 1 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 5 5 5 5 0 0 0 0\n0 2 0 2 0 1 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 0 5 5 5 0 0\n0 2 2 2 0 1 0 0 0 0 0 0 0 0 0 0 5 5 0 0 5 5 5 5 0 5 5 5 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 5 5 5 5 5 5 5 0 0\n0 1 1 1 0 1 0 0 0 5 5 5 5 5 0 0 0 0 0 5 0 0 5 5 5 5 5 0 0 0\n0 1 0 1 0 1 0 5 5 0 0 5 0 5 0 0 0 0 0 5 5 0 0 5 5 5 5 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 5 5 5 5 5 0 0 0\n0 1 0 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 0 0 5 5 5 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 0 0 5 5 0 0 0 0\n0 1 0 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 1 0 1 0 1 0 5 5 0 5 5 5 5 5 0 0 0 5 0 0 0 0 0 0 0 5 5 5 0\n0 1 1 1 0 1 0 0 5 5 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 5 5 5 0\n0 0 0 0 0 1 0 0 0 0 0 5 5 0 0 0 0 5 5 5 5 5 0 0 0 0 5 5 5 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n\nFor each test input, give your 
answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 0, + 8, + 0 + ], + [ + 0, + 8, + 0, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 8, + 0, + 0, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 0, + 8, + 0 + ], + [ + 0, + 8, + 8, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 0, + 8, + 8, + 8, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 0, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 6, + 6, + 0, + 0, + 6, + 0, + 1, + 0, 
+ 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 8, + 8, + 8, + 8, + 0, + 0, + 6, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 0, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 0, + 0, + 0, + 8, + 0, + 8, + 0, + 0, + 6, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 6, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 6, + 6, + 0, + 0, + 6, + 0, + 6, + 6, + 6, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 0, + 0, + 6, + 6, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 6, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 4, + 4, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, 
+ 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 4, + 4, + 4, + 0, + 1, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 4, + 0, + 4, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 4, + 4, + 4, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 0, + 7, + 
7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 0, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 2, 
+ 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 0, + 0, + 1, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_5dbc8537", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n9 4 4 4 4 4 9 4 4 4 4 4 4 4 4\n9 4 4 4 4 4 9 4 4 4 8 8 8 8 8\n9 9 4 4 9 9 9 4 4 4 8 8 8 8 8\n9 9 4 4 9 9 9 4 4 4 4 4 4 4 4\n9 9 4 4 9 9 9 4 3 3 4 1 
1 4 4\n9 9 4 4 9 9 9 4 3 3 4 1 1 4 4\n9 9 4 4 4 9 9 4 3 3 4 4 4 4 4\n9 9 4 4 9 9 9 4 3 3 4 5 5 5 5\n9 4 4 9 9 9 9 4 3 3 4 4 4 4 4\n9 4 4 9 9 9 9 4 3 3 4 4 4 4 4\n9 9 4 4 4 4 9 4 4 4 4 4 4 7 7\n9 9 9 4 4 9 9 4 5 5 5 5 4 7 7\n9 9 9 4 4 9 9 4 4 4 4 4 4 7 7\n9 9 9 4 4 9 9 4 4 0 4 4 4 4 4\n9 9 4 4 4 4 9 4 4 4 4 4 4 4 4\n\nOutput:\n9 8 8 8 8 8 9\n9 8 8 8 8 8 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 0 9 9\n9 9 3 3 9 9 9\n9 1 1 9 9 9 9\n9 1 1 9 9 9 9\n9 9 5 5 5 5 9\n9 9 9 7 7 9 9\n9 9 9 7 7 9 9\n9 9 9 7 7 9 9\n9 9 5 5 5 5 9\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 4 7 4 7 4 7 8 8 8 6 6 8 8 8 8 8 8 8 8\n8 7 4 7 4 7 4 8 9 8 6 6 8 8 1 1 1 8 8 8\n8 4 7 4 7 4 7 8 9 8 6 6 8 8 1 9 1 8 8 8\n8 7 4 7 4 7 4 8 9 8 6 6 8 8 1 1 1 8 0 8\n8 8 8 8 8 8 8 8 9 8 6 6 8 8 1 9 1 8 8 8\n8 8 5 5 8 8 8 8 9 8 8 8 8 8 1 1 1 8 8 8\n8 8 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 0 8\n8 8 5 5 8 8 3 3 3 8 8 8 8 8 8 4 4 8 8 8\n8 8 5 5 8 8 3 3 3 8 8 8 8 8 8 4 4 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 8 2 2 2 2 2 8 8 2 2 2 2 2 2 2\n2 2 2 2 8 8 8 2 2 2 8 8 8 2 2 2 2 2 2 2\n8 8 8 8 8 8 8 2 2 2 8 8 8 8 8 8 8 8 8 2\n8 8 8 8 8 8 8 2 2 2 8 8 8 8 8 8 8 8 8 8\n2 2 8 8 8 8 8 2 2 2 8 2 2 8 8 8 8 8 8 2\n2 2 8 8 8 8 8 8 8 8 8 2 2 8 8 8 8 8 8 2\n2 2 8 8 2 2 2 8 8 8 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nOutput:\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 0 2 2 2 2 2 5 5 2 2 2 2 2 2 2\n2 2 2 2 1 1 1 2 2 2 9 5 5 2 2 2 2 2 2 2\n4 4 6 6 1 9 1 2 2 2 9 5 5 4 7 4 7 4 7 2\n4 4 6 6 1 1 1 2 2 2 9 5 5 7 4 7 4 7 4 0\n2 2 6 6 1 9 1 2 2 2 9 2 2 4 7 4 7 4 7 2\n2 2 6 6 1 1 1 3 3 3 9 2 2 7 4 7 4 7 4 2\n2 2 6 6 2 2 2 3 3 3 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTest Input 1:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 1 1 3 3 1 1 3 3 3 3 1 3 3 3 3 3 3 3 3 1 1 3\n1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1 3 3 1 3 1 1 1 1 3\n1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 
1 3\n1 1 1 1 1 3 3 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 3\n1 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 3 3 1 3 3 3 1 1 1\n1 1 1 1 1 3 1 1 1 1 1 1 1 1 1 1 3 3 3 3 3 3 1 1 1\n1 1 1 1 1 3 3 1 1 3 3 1 1 1 1 1 3 3 3 3 3 3 1 1 1\n1 1 1 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 1 1 1\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 9 9 1 1 1 1 6 6 6 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 8 6 8 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 1 1 1 6 6 8 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 8 6 8 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 1 1 1 6 6 8 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 6 6 6 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 4 4 1 1 1 1 1 1 1 1 1 9 9 1 1 2 2 2 1 1 1\n1 9 9 1 4 4 1 7 7 7 7 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 4 4 1 7 7 7 7 1 1 1 1 1 1 1 1 1 1 1 8 8 1\n1 1 1 1 4 4 1 1 1 1 1 1 1 1 5 5 1 1 1 6 1 1 8 8 1\n1 8 8 1 4 4 1 0 1 0 1 1 1 1 5 5 1 1 1 6 1 1 1 1 1\n1 8 8 1 4 4 1 1 1 1 1 1 1 1 5 5 1 1 1 6 1 1 1 1 1\n1 1 1 1 9 9 1 0 1 0 1 1 1 1 1 1 1 1 1 6 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n1 3 3 1 1 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 3 3 1 1 1 1 3 4 7 4 7 3 9 9 9 8 3 3\n1 1 1 3 3 1 1 1 3 7 4 7 4 3 8 9 9 9 3 3\n1 1 1 1 3 3 1 1 3 4 7 4 7 3 3 3 3 3 3 3\n1 3 3 3 3 3 3 1 3 3 3 3 3 3 3 3 6 6 3 3\n1 3 3 3 3 3 3 1 3 6 6 3 3 3 3 3 6 6 3 3\n1 1 3 3 1 3 1 1 3 6 6 3 3 3 3 3 3 3 3 3\n1 1 3 3 1 1 1 1 3 3 3 3 3 5 5 3 3 3 3 3\n1 3 3 3 1 1 1 1 3 4 4 9 3 3 3 3 3 3 3 3\n1 3 3 3 1 1 1 1 3 9 4 4 3 3 3 5 5 3 3 3\n1 1 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 3 3 3 3 1 3 3 8 8 8 3 3 3 3 3 3 3\n1 1 1 3 3 3 3 1 3 3 3 3 3 3 3 3 3 3 0 3\n1 3 3 3 3 1 1 1 3 3 2 2 2 2 2 2 3 3 3 3\n1 3 3 3 3 1 1 1 3 3 2 2 2 2 2 2 3 3 0 3\n1 3 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 3 3 3 1 1 3 3 3 3 3 5 5 3 3 3 0 3\n1 1 1 3 3 1 1 1 3 4 4 9 3 3 3 3 3 3 3 3\n1 1 3 3 3 3 1 1 3 9 4 4 3 3 5 5 3 3 3 3\n1 1 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, 
etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 3, + 3, + 4, + 4, + 3, + 3, + 3, + 3, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3 + ], + [ + 2, + 2, + 2, + 4, + 4, + 8, + 8, + 4, + 4, + 3, + 3, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 0, + 3, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 5, + 2, + 4, + 4, + 8, + 8, + 4, + 4, + 3, + 3, + 6, + 8, + 6, + 8, + 6, + 7, + 7, + 7, + 7, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 2, + 2, + 4, + 4, + 3, + 3, + 4, + 4, + 3, + 3, + 6, + 6, + 8, + 6, + 6, + 7, + 7, + 7, + 7, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 5, + 2, + 4, + 4, + 3, + 3, + 4, + 4, + 8, + 8, + 6, + 8, + 6, + 8, + 6, + 3, + 3, + 0, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 2, + 2, + 4, + 4, + 3, + 0, + 4, + 4, + 8, + 8, + 6, + 6, + 8, + 6, + 6, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 5, + 2, + 9, + 9, + 3, + 3, + 9, + 9, + 3, + 3, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 1, + 5, + 5, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 5, + 5, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 5, + 5, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 5, + 5, + 1, + 1 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1 + ], + [ + 1, + 1, + 6, + 6, + 1, + 0, + 1, + 1 + ], + [ + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1 + ], + [ + 1, + 4, + 4, + 9, + 1, + 1, + 1, + 1 + ], + [ + 1, + 9, + 4, + 4, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 8, + 8, + 8, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 9, + 9, + 9, + 8, + 1 + ], + [ + 
1, + 1, + 1, + 8, + 9, + 9, + 9, + 1 + ], + [ + 1, + 4, + 7, + 4, + 7, + 1, + 1, + 1 + ], + [ + 1, + 7, + 4, + 7, + 4, + 1, + 1, + 1 + ], + [ + 1, + 4, + 7, + 4, + 7, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 6, + 6, + 0, + 1, + 1 + ], + [ + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1 + ], + [ + 1, + 1, + 4, + 4, + 9, + 0, + 1, + 1 + ], + [ + 1, + 1, + 9, + 4, + 4, + 1, + 1, + 1 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_d35bdbdc", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 3 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 3 3 3\n0 0 5 5 5 5 5 3 4 3\n0 5 0 0 0 0 0 3 3 3\n0 5 4 4 4 0 0 0 0 0\n5 0 4 2 4 0 0 6 6 6\n0 5 4 4 4 0 5 6 1 6\n0 5 5 5 5 5 0 6 6 6\n0 0 1 1 1 0 0 0 0 0\n0 0 1 3 1 0 0 0 0 0\n0 0 1 1 1 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 3 3 3\n0 0 5 5 5 5 5 3 2 3\n0 5 0 0 0 0 0 3 3 3\n0 5 0 0 0 0 0 0 0 0\n5 0 0 0 0 0 0 6 6 6\n0 5 0 0 0 0 5 6 3 6\n0 5 5 5 5 5 0 6 6 6\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n2 2 2 0 0 0 3 3 3 0\n2 6 2 0 0 0 3 2 3 0\n2 2 2 0 5 0 3 3 3 0\n0 0 0 5 0 5 5 5 5 0\n8 8 8 0 5 0 0 1 1 1\n8 3 8 0 0 5 0 1 4 1\n8 8 8 0 5 0 0 1 1 1\n0 5 0 5 4 4 4 0 0 0\n0 5 5 0 4 8 4 0 0 0\n0 0 0 0 4 4 4 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 5 0 5 5 5 5 0\n8 8 8 0 5 0 0 1 1 1\n8 2 8 0 0 5 0 1 8 1\n8 8 8 0 5 0 0 1 1 1\n0 5 0 5 0 0 0 0 0 0\n0 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n1 1 1 0 0 0 0 4 4 4\n1 2 1 0 0 0 0 4 3 4\n1 1 1 0 0 5 0 4 4 4\n0 5 0 0 5 0 5 0 0 0\n0 5 0 5 3 3 3 5 0 0\n0 0 5 0 3 6 3 0 5 0\n0 0 0 0 3 3 3 0 5 0\n2 2 2 0 0 0 0 7 7 7\n2 9 2 0 0 0 0 7 4 7\n2 2 2 0 0 0 0 7 7 7\n\nOutput:\n1 1 1 0 0 0 0 0 0 0\n1 9 1 0 0 0 0 0 0 0\n1 1 1 0 0 5 0 0 0 0\n0 5 0 0 5 0 5 0 0 0\n0 5 0 5 0 0 0 5 0 0\n0 0 5 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 7 7 7\n0 0 0 0 0 0 0 7 3 7\n0 0 0 0 0 0 0 7 7 7\n\nTest Input 1:\n0 0 0 0 0 0 0 2 
0 0\n0 0 4 0 0 0 2 3 2 0\n0 4 2 4 0 0 0 2 0 0\n0 0 4 0 0 0 0 5 0 0\n0 0 0 0 0 0 5 0 0 0\n0 0 0 0 1 0 5 0 3 0\n0 7 0 1 9 1 5 3 3 3\n7 1 7 0 1 0 5 0 3 0\n0 7 0 5 0 5 0 0 0 0\n0 5 5 0 5 0 0 0 0 0\n\nTest Input 2:\n0 0 0 4 4 4 0 2 2 2\n0 0 5 4 2 4 5 2 3 2\n0 0 5 4 4 4 5 2 2 2\n0 0 0 5 0 0 5 5 5 5\n0 0 5 1 1 1 0 0 0 5\n0 5 0 1 3 1 5 5 5 0\n0 0 5 1 1 1 5 3 3 3\n6 6 6 5 0 0 5 3 6 3\n6 9 6 5 5 5 5 3 3 3\n6 6 6 0 0 0 0 0 0 0\n\nTest Input 3:\n0 0 0 1 1 1 0 6 6 6\n0 0 0 1 3 1 0 6 1 6\n0 0 0 1 1 1 0 6 6 6\n5 5 5 5 5 0 0 0 5 0\n5 2 2 2 5 0 0 0 5 0\n5 2 4 2 5 3 3 3 5 0\n5 2 2 2 5 3 9 3 0 5\n0 5 5 0 5 3 3 3 0 5\n0 7 7 7 0 5 5 0 0 5\n0 7 2 7 0 0 0 5 5 0\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 3, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 7, + 9, + 7, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 5, + 0, + 5, + 0, + 0, + 0, + 0 + ], + [ + 0, + 5, + 5, + 0, + 5, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 2, + 2, + 2 + ], + [ + 0, + 0, + 5, + 4, + 3, + 4, + 5, + 2, + 6, + 2 + ], + [ + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 2, + 2, + 2 + ], + [ + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 5, + 5, + 5 + ], + [ + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 5, + 0, + 0, + 0, + 0, + 5, + 5, + 5, + 0 + ], + [ + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 5, + 5, + 5, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, 
+ 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 3, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], + [ + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 5, + 5, + 0, + 5, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 7, + 7, + 7, + 0, + 5, + 5, + 0, + 0, + 5 + ], + [ + 0, + 7, + 4, + 7, + 0, + 0, + 0, + 5, + 5, + 0 + ] + ] + ], + "num_test_pairs": 3, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_8e5c0c38", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 1 1 8 8 8 8 8 1 1 8 8 6 6 6 6 8 8 8\n8 8 8 8 8 1 8 8 8 8 8 1 8 8 8 8 6 8 6 8 8 8\n8 8 8 8 1 1 8 1 1 1 8 1 8 8 8 8 6 6 6 8 8 8\n8 8 8 8 1 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 2 2 8 8 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 1 1 1 8 1 
1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 1 1 8 8 8 8 8 1 1 8 8 8 6 6 6 8 8 8\n8 8 8 8 8 1 8 8 8 8 8 1 8 8 8 8 6 8 6 8 8 8\n8 8 8 8 8 1 8 1 1 1 8 1 8 8 8 8 6 6 6 8 8 8\n8 8 8 8 8 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 2 2 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 2 2 0 0 2 2 0 0\n0 0 0 0 0 8 8 0 8 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 8 8 0 8 0 0 0 0 0 0 0 2 2 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 4 4 4 0 0 0 4 4 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 2 2 0 
0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 2 2 0 0 2 2 0 0\n0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 2 2 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 0 0 0 4 4 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 6 6 6 6 1 6 6 6 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 6 6 1 1 1 1 1 1 6 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 6 1 1 1 1 1 1 6 1 1 1 1 1 1 1 1\n1 1 1 6 6 6 6 1 1 1 6 1 1 6 6 6 1 1 1 1 1 1\n1 1 1 6 6 6 6 1 6 6 6 6 1 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 1 6 6 6 1 1 6 6 6 6 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 6 1 1 1 1 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 6 6 6 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 6 6 1 1 1 1 6 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 6 6 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 6 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 3 3 1\n1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 3 3 3 3 1\n1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1 3 1 1 1\n1 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 4 4 2 2 2 2 4 4 
4 4 4 4 4 4 4 4\n4 4 2 4 4 2 2 2 4 4 2 2 4 4 4 3 3 3 3 3 3 4\n4 4 2 2 4 4 4 4 4 2 2 4 4 4 4 4 3 4 3 4 4 4\n4 4 4 2 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 2 2 2 4 2 2 2 2 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 1 1 4 4 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 4 1 1 1 1 4 1 4 4 4 4\n4 4 4 4 4 4 4 4 1 1 1 4 4 4 4 4 4 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 6, + 1, + 1, + 6, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 
1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 6, + 6, + 6, + 6, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 3, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1 + ], + [ + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 4, + 4, + 4, + 2, + 
2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 4, + 4, + 2, + 2, + 2, + 4, + 4, + 2, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 3, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 2, + 4, + 2, + 2, + 2, + 4, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 2, + 2, + 2, + 4, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 4, + 4, + 1, + 1, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 1, + 1, + 1, + 1, + 4, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, 
+ 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_d8e07eb2", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 1 1 1 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 8 1 8 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 1 1 1 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 0 0 0 3 3 1 1 1 3 3 7 3 3 3 3 3 6 6 3 3\n3 3 0 0 0 3 3 3 1 3 3 3 7 7 7 3 3 3 3 6 3 3\n3 3 0 0 0 3 3 1 1 1 3 3 7 3 3 3 3 3 6 6 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 
3 3 3 3 3\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 8\n8 3 7 3 3 3 3 1 1 1 3 3 3 6 6 3 3 0 0 0 3 8\n8 3 7 7 7 3 3 3 1 3 3 3 3 3 6 3 3 0 0 0 3 8\n8 3 7 3 3 3 3 1 1 1 3 3 3 6 6 3 3 0 0 0 3 8\n8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 8 8 8 8 1 1 1 8 8 6 6 6 8 8 2 2 8 8 8\n8 8 0 0 0 8 8 8 1 8 8 8 6 8 6 8 8 2 2 2 8 8\n8 8 0 8 0 8 8 1 1 1 8 8 6 8 6 8 8 8 2 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 
8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 0 3 3 3 3 1 1 1 3 3 6 6 6 3 3 2 2 3 3 3\n3 3 0 0 0 3 3 3 1 3 3 3 6 3 6 3 3 2 2 2 3 3\n3 3 0 3 0 3 3 1 1 1 3 3 6 3 6 3 3 3 2 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 3 0 3 3 3 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 3 0 0 0 3 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 3 0 3 0 3 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 3 3 1 3 3 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 3 2 2 2 3 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 3 6 6 6 3 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 3 6 3 6 3 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 3 6 3 6 3 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTraining Example 3:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 4 8 4 8 8 2 2 8 8 8 2 2 2 8 
8\n8 8 8 2 8 8 8 4 8 4 8 8 2 2 2 8 8 2 8 2 8 8\n8 8 2 8 2 8 8 4 4 4 8 8 8 2 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 4 8 4 8 8 2 2 8 8 8 2 2 2 8 8\n8 8 8 2 8 8 8 4 8 4 8 8 2 2 2 8 8 2 8 2 8 8\n8 8 2 8 2 8 8 4 4 4 8 8 8 2 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 2 3 2 3 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 3 3 2 3 3 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 3 2 3 2 3 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 3 4 3 4 3 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 3 4 3 4 3 3 2 2 2 3 8 5 8 8 8 8 1 1 8 8 8\n8 3 4 4 4 3 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 3 2 2 2 3 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 3 2 3 2 3 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 3 2 2 2 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTraining Example 4:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 2 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 2 2 2 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 8 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 2 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 2 2 2 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 8 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3 8\n8 3 7 3 3 3 8 1 1 1 8 3 3 6 6 3 3 0 0 0 3 8\n8 3 7 7 7 3 8 8 1 8 8 3 3 3 6 3 3 0 0 0 3 8\n8 3 7 3 3 3 8 1 1 1 8 3 3 6 6 3 3 0 0 0 3 8\n8 3 3 3 3 3 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 3 2 2 2 3 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTraining Example 5:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 8 9 8 8 8 8 8 8 8\n8 8 8 1 8 8 8 1 1 8 8 8 9 9 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 9 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 
1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 8 9 8 8 8 8 8 8 8\n8 8 8 1 8 8 8 1 1 8 8 8 9 9 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 9 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 3 9 3 9 3 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 3 9 9 3 3 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 3 9 9 9 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 3 3 1 3 3 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 3 1 3 1 3 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 3 1 1 3 3 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 3 1 3 1 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 
6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTest Input 1:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 1 8 1 8 8 9 8 9 8 8 2 2 2 8 8\n8 8 0 0 0 8 8 1 1 8 8 8 9 9 8 8 8 2 8 2 8 8\n8 8 0 0 0 8 8 1 8 1 8 8 9 9 9 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 7 8 8 8 8 2 2 8 8 8 5 5 8 8 8\n8 8 8 2 8 8 8 7 7 7 8 8 2 2 2 8 8 5 8 8 8 8\n8 8 2 8 2 8 8 7 8 8 8 8 8 2 8 8 8 5 5 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 3, + 1, + 3, + 3, + 9, + 3, + 9, + 3, + 3, + 2, + 2, + 2, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 1, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 2, + 3, + 2, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 3, + 1, + 3, + 3, + 9, + 9, + 9, + 3, + 3, + 2, + 2, + 2, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 0, + 8, + 
8, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 9, + 3, + 9, + 3, + 8 + ], + [ + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 9, + 9, + 3, + 3, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 0, + 8, + 0, + 8, + 8, + 7, + 7, + 7, + 8, + 3, + 9, + 9, + 9, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 8, + 2, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 3, + 1, + 3, + 1, + 3, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 8, + 2, + 2, + 2, + 8, + 8, + 5, + 8, + 8, + 8, + 3, + 1, + 1, + 3, + 3, + 8 + ], + [ + 8, + 8, + 4, + 4, + 4, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 3, + 1, + 3, + 1, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 6, + 6, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 3, + 2, + 2, + 2, + 3, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 4, + 4, + 4, + 8, + 3, + 2, + 3, + 2, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 6, 
+ 8, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 3, + 2, + 2, + 2, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 2, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 2, + 2, + 2, + 8, + 8, + 5, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 2, + 3, + 2, + 3, + 8, + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 9, + 8, + 9, + 8, + 8 + ], + [ + 8, + 3, + 3, + 2, + 3, + 3, + 8, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 9, + 9, + 8, + 8, + 8 + ], + [ + 8, + 3, + 2, + 3, + 2, + 3, + 8, + 0, + 8, + 0, + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, 
+ 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 7, + 3, + 3, + 3, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 7, + 7, + 7, + 3, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 7, + 3, + 3, + 3, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 3, + 2, + 2, + 3, + 3, + 3, + 5, + 5, + 3, + 3, + 8, + 1, + 8, + 1, + 8, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 3, + 2, + 2, + 2, + 3, + 3, + 5, + 3, + 3, + 3, + 8, + 1, + 1, + 8, + 8, + 8 + ], + [ + 8, + 8, + 4, + 4, + 4, + 8, + 3, + 3, + 2, + 3, + 3, + 3, + 5, + 5, + 3, + 3, + 8, + 1, + 8, + 1, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 6, + 6, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 2, + 2, + 2, + 8, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 4, + 4, + 4, + 8, + 8, + 2, + 8, + 2, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 2, + 2, + 2, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 2, + 2, + 2, + 
2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_a25697e4", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 4 4 3 3 3 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n4 4 4 4 1 1 1 1 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 
1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 2:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n3 3 3 3 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 3 3 4 4 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 
1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 3:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 5 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 7 7 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 1 1 1 1 6 1 1 1 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 1 1 1 1 6 1 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 1 6 6 6 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 5 5 5 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 7 7 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 6 6 6 1 1 1 1 1 1 1 1 1\n\nTest Input 1:\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 
4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 3 3 3 3 3 1 1 1 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 1 1 1 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 4 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 1 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 8 8 2 2 8 8 8\n8 8 8 8 8 8 8 8 8 4 6 6 8 8 8 8 2 2 8 8 8 2 8 8 8\n8 8 8 8 8 8 4 4 4 4 6 8 8 8 8 8 8 8 8 8 8 8 8 8 
8\n8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 7 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 3 3 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 3 8 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 
2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 3, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 1, + 1, + 1, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 1, + 1, + 1, + 1, + 1 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, 
+ 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, 
+ 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 2, + 2, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 7, + 2, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 7, + 7, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 6, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 4, + 4, + 4 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 6, + 4, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_71e489b6", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n1 1 1 0 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 0 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 0 0 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0\n0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 7 0 7 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 7 7 7 1 1 1 1 1 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 0\n1 1 1 1 1 1 1 7 7 7 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 7 0 7 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 7 7 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 7 0 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 0 0 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 7 7 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 7 7 7 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 7 0 7 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 7 7 7 1\n\nTraining Example 2:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 
1\n1 1 1 0 0 0 1 1 1 1 1 1 0 1 1 1\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 0 1\n1 1 0 0 0 0 1 1 0 1 1 1 0 1 1 1\n1 1 0 0 1 0 1 1 1 1 1 1 0 1 1 0\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 1 1 1 1 1 1 0 7 7 7\n1 1 0 0 0 0 1 7 7 7 1 1 0 7 0 7\n1 1 0 0 0 0 1 7 0 7 1 1 0 7 7 7\n1 1 0 0 0 0 1 7 7 7 1 1 0 1 7 0\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 7 7\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 7 7 7 7 1 1 1 1 1 1 1\n1 1 1 1 1 7 0 0 7 1 1 1 1 1 1 1\n1 1 1 1 1 7 7 7 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 1\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 0 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 0 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 0 1 1 1 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 7 7 7 1 1 0 0\n0 0 0 0 1 1 1 1 1 7 0 7 7 1 0 0\n0 0 0 0 1 1 1 1 1 7 7 0 7 1 0 0\n0 0 0 0 1 1 1 1 1 1 7 7 7 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 7 7 7 1 1 1 1 1 0 0\n0 0 0 0 1 1 7 0 7 1 1 1 1 1 0 0\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 
0\n\nTest Input 1:\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 1\n1 1 1 1 1 0 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 0 1 1 1 1 1 1 1 1 1 0 1\n1 1 1 0 1 1 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 1 0 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 1 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 1\n\nTest Input 2:\n0 0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 1 1 0 1 1 1 1 1 1 1 1 1 1 1 0 1 1\n0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0\n0 0 1 1 1 1 0 1 1 0 0 0 0 1 0 0 0 0 0\n0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0\n1 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 0 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 0 1 0 1 1 0 0 1 1 1 0 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 0 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 0 1 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 1 0 0 1 1 1 1 1 1 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 1 1 0 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 7, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 7, + 0, + 7, + 7, + 1, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 0, + 7, + 7, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1 + ], + [ + 0, + 0, + 1, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 7, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 0, + 7, + 7, + 1, + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 0, + 7, + 0, + 7, + 1, + 0, + 0, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 7, + 7, + 1, + 0, + 0, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 
1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 1, + 1, + 1, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 7, + 7, + 1, + 1, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 7, + 1, + 1, + 1, + 1 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + }, + { + "problem_id": "arc2_446ef5d2", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7 7\n8 8 8 8 8 8 8 8 8 7 7 7 7 7 7 8 8 2 2 2\n8 8 8 8 8 8 8 8 8 0 0 0 7 0 7 8 8 7 7 7\n8 8 8 8 8 8 8 8 8 0 7 0 0 0 7 8 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 7 0 0 0 0 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 7 0 7 0 0 8 8 8 8 8 8 8 8 8 7 7 7 8 8\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 2 2 7 8 8\n8 7 2 7 2 2 8 8 8 8 8 8 8 8 8 7 2 7 8 8\n8 7 2 2 2 7 8 8 8 8 8 8 8 8 8 7 7 7 4 8\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 8 8 4 4 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 7 0 0 0 0 0 0 0 7 0 7 8 8\n8 8 8 8 8 8 8 7 0 7 0 0 0 7 0 0 0 7 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 7 2 7 2 2 2 2 2 2 2 7 8 8\n8 8 8 8 8 8 8 7 2 2 2 7 7 7 7 7 2 7 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8 8 8\n8 4 4 8 8 8 9 9 3 
8\n8 4 3 3 3 8 3 3 3 8\n8 8 3 9 9 8 3 3 3 8\n8 8 3 9 9 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n8 3 3 3 8 8 3 9 9 8\n8 9 9 3 8 8 3 9 3 8\n8 9 9 3 8 8 3 3 3 8\n8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n8 8 3 3 3 3 3 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 3 3 3 3 8 8\n8 8 3 3 3 3 3 3 8 8\n8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n\nTest Input 1:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 1 1 1\n4 1 3 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 3 3 4 6 6 1\n4 1 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 1 1 4 1 6 1\n4 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 1 1 4 1 6 1\n4 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 6 6 1\n4 1 1 6 6 4 1 1 1 1 3 1 4 4 4 4 1 1 7 1 1 1 4 1 1 1\n4 1 1 6 1 4 3 3 3 3 3 1 4 4 4 4 1 1 7 1 1 1 4 4 4 4\n4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4 7 7 7 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4\n1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n1 1 1 4 4 4 4 1 1 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 1 1 4 4 4 4 3 3 3 3 3 1 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 6 6 4 4 4 4 1 1 1 1 3 1 4 4 4 4 4 4 4 1 1 1 1 1 1\n4 1 1 4 4 4 4 1 1 1 1 3 1 4 1 1 6 1 1 4 7 7 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 6 6 6 4 1 1 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 4 1 1 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4 4 4 4 4 4\n4 4 1 7 1 1 4 4 4 4 4 4 4 4 1 7 7 7 4 4 4 4 4 4 4 4\n4 4 1 7 7 7 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 4 1 1 1 1 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 2 1 1 1 1 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 2 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 9 9 9 8 8 8 8 8 8 8 4 4 8\n8 8 8 8 8 8 3 3 9 9 8 8 8 8 8 9 9 9 4 8\n9 9 9 8 8 8 9 3 9 9 8 8 8 8 8 9 3 9 8 8\n9 3 3 8 8 8 3 3 3 3 8 8 8 8 8 3 
3 9 8 8\n9 3 9 8 8 8 9 3 3 3 8 8 8 8 8 3 3 9 8 8\n9 3 3 8 8 8 3 3 9 9 8 8 8 8 8 8 8 8 8 8\n9 3 9 8 8 8 9 9 9 9 8 8 8 8 8 8 8 8 8 8\n9 3 3 8 8 8 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n9 9 9 8 8 8 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 3 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 9 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 9 8 8 8 8\n8 8 8 9 9 9 8 8 8 8 8 8 8 9 3 3 8 8 8 8\n8 8 8 9 3 9 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 9 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 9 3 3 8 8 8 8 8 3 3 9 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 3 3 9 8 8 8 8 8 8\n8 8 8 9 9 9 8 8 8 8 8 9 9 9 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 
4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 
1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 9, + 9, + 3, + 9, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 9, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + 
], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "num_test_pairs": 2, + "topic": "arc", + "source": "ARC2-Eval" + } +] \ No newline at end of file diff --git a/arc/arc_problems.py b/arc/arc_problems.py new file mode 100644 index 0000000..0c3228c --- /dev/null +++ b/arc/arc_problems.py @@ -0,0 +1,197 @@ +# Author: Claude Sonnet 4.6 +# Date: 30-March-2026 +# PURPOSE: ARC Problem Generator for AmnesiaBench. Fetches ARC puzzle tasks from +# the public API (arc.markbarney.net), formats them as AmnesiaBench-compatible +# problem JSON with space-separated numeric grids, and saves to arc_problems.json. +# Handles 15 unsolved tasks (1 ARC1-Eval + 14 ARC2-Eval) and 8 hardest solved +# ARC2-Eval tasks (23 tasks = 23 problems). All test pairs are included in each +# problem — model must solve ALL test pairs correctly for the task to count as solved. +# No external dependencies beyond stdlib. +# SRP/DRY check: Pass — single responsibility (fetch + format ARC tasks), grid formatting +# extracted to helper function, no duplication. 
import json
import sys
import time
import urllib.request
import urllib.error


# ── Task Definitions ──────────────────────────────────────────────────────────

UNSOLVED_ARC1_EVAL = ["50f325b5"]

UNSOLVED_ARC2_EVAL = [
    "62593bfd", "2b83f449", "88bcf3b4", "8b7bacbf", "faa9f03d",
    "269e22fb", "4e34c42c", "21897d95", "abc82100", "9bbf930d",
    "a32d8b75", "e12f9a14", "13e47133", "88e364bc",
]

HARDEST_SOLVED_ARC2_EVAL = [
    "e3721c99", "5dbc8537", "d35bdbdc", "8e5c0c38",
    "d8e07eb2", "a25697e4", "71e489b6", "446ef5d2",
]

API_BASE = "https://arc.markbarney.net/api/puzzle/task"


# ── Helpers ───────────────────────────────────────────────────────────────────

def grid_to_text(grid: list[list[int]]) -> str:
    """Convert a 2D int grid to space-separated rows, one row per line."""
    return "\n".join(" ".join(str(cell) for cell in row) for row in grid)


def estimate_tokens(text: str) -> int:
    """Rough token estimate: one token per 4 characters (integer division)."""
    return len(text) // 4


def fetch_task(task_id: str, retries: int = 3) -> dict:
    """Fetch a single ARC task from the API, retrying with exponential backoff.

    Args:
        task_id: ARC task identifier appended to ``API_BASE``.
        retries: Total number of attempts (must be at least 1).

    Returns:
        The ``"data"`` member of the JSON response.

    Raises:
        ValueError: If ``retries`` is smaller than 1.
        RuntimeError: If every attempt failed; the last underlying error is
            attached as ``__cause__``.
    """
    if retries < 1:
        # Without this guard the loop body never runs and the function would
        # silently return None instead of a task dict.
        raise ValueError(f"retries must be >= 1, got {retries}")

    url = f"{API_BASE}/{task_id}"
    for attempt in range(retries):
        try:
            req = urllib.request.Request(url, headers={"User-Agent": "AmnesiaBench/1.0"})
            with urllib.request.urlopen(req, timeout=30) as resp:
                data = json.loads(resp.read().decode("utf-8"))
            if not data.get("success"):
                raise ValueError(f"API returned success=false for {task_id}")
            return data["data"]
        # OSError covers URLError/HTTPError as well as timeouts and connection
        # resets raised while reading the body; ValueError covers malformed
        # JSON and the explicit success=false check above.
        except (OSError, ValueError) as e:
            if attempt == retries - 1:
                raise RuntimeError(
                    f"Failed to fetch {task_id} after {retries} attempts: {e}"
                ) from e
            wait = 2 ** attempt
            print(f" Retry {attempt + 1}/{retries} for {task_id} after {wait}s: {e}")
            time.sleep(wait)


def build_problem_text(train_pairs: list[dict], test_pairs: list[dict]) -> str:
    """Build the full problem text with training examples and ALL test inputs.

    All test pairs are presented together. The model must solve each one.
    For single-test tasks, phrasing is singular. For multi-test, each is numbered.

    Args:
        train_pairs: Dicts with ``"input"`` and ``"output"`` grids.
        test_pairs: Dicts whose ``"input"`` grid is shown to the model.

    Returns:
        The prompt text, sections joined by newlines.
    """
    # NOTE(review): the answer-tag names in the two instruction strings below
    # appear to be missing ("in ... tags", "a numbered tag: for test 1") —
    # confirm the wording against what the ARC answer evaluator parses.
    single = len(test_pairs) == 1
    parts = []

    if single:
        parts.append("ARC Puzzle: Predict the test output grid.")
    else:
        parts.append(f"ARC Puzzle: Predict the output grid for each of the {len(test_pairs)} test inputs.")

    for i, pair in enumerate(train_pairs, 1):
        parts.append(f"\nTraining Example {i}:")
        parts.append(f"Input:\n{grid_to_text(pair['input'])}")
        parts.append(f"\nOutput:\n{grid_to_text(pair['output'])}")

    if single:
        parts.append(f"\nTest Input:\n{grid_to_text(test_pairs[0]['input'])}")
        parts.append("\nGive your answer in ... tags, space-separated values, one row per line.")
    else:
        for t_idx, test_pair in enumerate(test_pairs, 1):
            parts.append(f"\nTest Input {t_idx}:\n{grid_to_text(test_pair['input'])}")
        parts.append("\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.")
        parts.append("Use space-separated values, one row per line.")

    return "\n".join(parts)


def determine_source(task_id: str) -> str:
    """Return "ARC1-Eval" for IDs in UNSOLVED_ARC1_EVAL, otherwise "ARC2-Eval"."""
    if task_id in UNSOLVED_ARC1_EVAL:
        return "ARC1-Eval"
    return "ARC2-Eval"


def determine_problem_id(task_id: str) -> str:
    """Return the task ID prefixed with "arc1_" or "arc2_" to match its source."""
    if task_id in UNSOLVED_ARC1_EVAL:
        return f"arc1_{task_id}"
    return f"arc2_{task_id}"


def build_problem(task_id: str, task_data: dict) -> dict:
    """Build a single AmnesiaBench problem dict from fetched task data.

    All test pairs are included in one problem. ground_truth is a list of grids
    (one per test pair). Model must solve ALL test pairs correctly = task solved.

    Args:
        task_id: ARC task identifier.
        task_data: Dict with ``"train"`` and ``"test"`` lists of grid pairs.

    Returns:
        Dict with problem_id, problem_text, ground_truth, num_test_pairs,
        topic and source keys.
    """
    train_pairs = task_data["train"]
    test_pairs = task_data["test"]

    # ground_truth stays a list even for a single test pair, for consistency.
    return {
        "problem_id": determine_problem_id(task_id),
        "problem_text": build_problem_text(train_pairs, test_pairs),
        "ground_truth": [tp["output"] for tp in test_pairs],
        "num_test_pairs": len(test_pairs),
        "topic": "arc",
        "source": determine_source(task_id),
    }


# ── Main ──────────────────────────────────────────────────────────────────────

def main():
    """Fetch every configured task, write arc_problems.json, print a summary."""
    all_task_ids = UNSOLVED_ARC1_EVAL + UNSOLVED_ARC2_EVAL + HARDEST_SOLVED_ARC2_EVAL
    problems = []
    total_tokens = 0
    grid_sizes = []

    print(f"Fetching {len(all_task_ids)} ARC tasks from {API_BASE}...")
    print()

    for i, task_id in enumerate(all_task_ids, 1):
        source = determine_source(task_id)
        print(f" [{i:2d}/{len(all_task_ids)}] {task_id} ({source})...", end=" ", flush=True)

        task_data = fetch_task(task_id)
        problem = build_problem(task_id, task_data)
        problems.append(problem)

        # Stats
        n_pairs = problem["num_test_pairs"]
        pair_info = []
        for gt in problem["ground_truth"]:
            rows = len(gt)
            cols = len(gt[0]) if gt else 0
            grid_sizes.append((rows, cols))
            pair_info.append(f"{rows}x{cols}")
        tokens = estimate_tokens(problem["problem_text"])
        total_tokens += tokens

        grids_str = ", ".join(pair_info)
        print(f"OK — {n_pairs} test pair{'s' if n_pairs > 1 else ''} ({grids_str}), ~{tokens} tokens")

        # Be polite to the API
        if i < len(all_task_ids):
            time.sleep(0.3)

    # Save (path is relative to the current working directory)
    output_path = "arc_problems.json"
    with open(output_path, "w", encoding="utf-8") as f:
        json.dump(problems, f, indent=2)

    # Summary
    # Row and column extremes are taken independently, so the printed
    # "RxC to RxC" range need not correspond to actual grids.
    row_counts = [r for r, _ in grid_sizes]
    col_counts = [c for _, c in grid_sizes]
    print()
    print("=" * 60)
    print(f" Problems generated: {len(problems)}")
    print(f" ARC1-Eval: {sum(1 for p in problems if p['source'] == 'ARC1-Eval')}")
    print(f" ARC2-Eval: {sum(1 for p in problems if p['source'] == 'ARC2-Eval')}")
    print(f" Grid sizes: {min(row_counts)}x{min(col_counts)} "
          f"to {max(row_counts)}x{max(col_counts)}")
    print(f" Total token est: ~{total_tokens:,}")
    print(f" Avg tokens/problem: ~{total_tokens // len(problems):,}")
    print(f" Saved to: {output_path}")
    print("=" * 60)


if __name__ == "__main__":
    main()
# ── SIMPLE — Son's preferred version ──────────────────────────────────────────
#
# Minimal instruction. Explains what grids are and what the task is.
# Lets the model use its own reasoning approach.
#
# NOTE(review): the final sentence of both prompts reads "numbered tags: for
# test 1, for test 2" with no tag names — presumably markup was lost; confirm
# the wording against what the ARC answer evaluator parses.

ARC_SYSTEM_PROMPT_SIMPLE = """You are solving a pattern transformation puzzle.

You will see grids of numbers (0-9). Each number represents a different colored element. Training examples show input grids and their corresponding output grids. Every training example follows the SAME deterministic transformation rule.

Your job is to discover this rule and apply it to the test input(s) to predict the correct output grid(s). The rule must explain ALL training examples — if your hypothesis fails on any example, revise it.

Give each answer inside numbered tags: for test 1, for test 2, etc. Use space-separated values, one row per line."""


# ── GUIDED — Mark's preferred version ────────────────────────────────────────
#
# Teaches 7 concrete strategies derived from arc-explainer's GEPA mode,
# visual solver, and basePrompts.ts. For models with limited or no ARC
# training data that need scaffolding on how to approach these puzzles.
# The opening paragraph and the closing answer-format sentence are the same
# text as in the SIMPLE variant; only the numbered strategy list is added.

ARC_SYSTEM_PROMPT_GUIDED = """You are solving a pattern transformation puzzle.

You will see grids of numbers (0-9). Each number represents a different colored element. Training examples show input grids and their corresponding output grids. Every training example follows the SAME deterministic transformation rule. Your job is to discover this rule and apply it to the test input(s) to predict the correct output grid(s).

Approach the puzzle systematically:

1. START SIMPLE. Check for global transformations first: rotation, reflection, transposition, uniform color replacement, cropping, or scaling. Many puzzles have surprisingly simple rules.

2. LOOK FOR STRUCTURE. Check if rows or columns of a single value divide the grid into sections. The transformation may apply independently to each section.

3. IDENTIFY OBJECTS. Group connected cells of the same non-zero value into objects. Track how objects change between input and output: do they move, change color, change shape, grow, shrink, duplicate, or disappear?

4. FIND MARKERS. Look for cells with unique values or positions that might define where or how a transformation applies — like anchor points, corners of a region, or signals that trigger a specific operation.

5. CONSIDER COMPOSITION. The transformation may require multiple steps applied in sequence. One operation may need to happen before another makes sense. Try decomposing complex changes into simpler sub-rules applied in order.

6. VERIFY ACROSS ALL EXAMPLES. The rule MUST explain every training example, not just one. If your hypothesis fails on any example, it is wrong — revise it. Do not fixate on patterns that only appear in a single example.

7. IGNORE NOISE. Some properties may vary between examples without being part of the rule. If something is not consistent across all input-output pairs, it is not relevant to the transformation.

Give each answer inside numbered tags: for test 1, for test 2, etc. Use space-separated values, one row per line."""


# ── Default alias ─────────────────────────────────────────────────────────────
#
# ARC_SYSTEM_PROMPT is the name imported by amnesia_bench.py
# (`from arc.arc_prompts import ARC_SYSTEM_PROMPT`); rebinding it here switches
# the variant that import resolves to.

ARC_SYSTEM_PROMPT = ARC_SYSTEM_PROMPT_SIMPLE


# Running the module directly prints both variants with their character counts
# and a chars // 4 token estimate, for quick side-by-side inspection.
if __name__ == "__main__":
    print("ARC System Prompts — A/B Variants")
    print("=" * 60)
    print(f"SIMPLE: {len(ARC_SYSTEM_PROMPT_SIMPLE)} chars, ~{len(ARC_SYSTEM_PROMPT_SIMPLE) // 4} tokens")
    print(f"GUIDED: {len(ARC_SYSTEM_PROMPT_GUIDED)} chars, ~{len(ARC_SYSTEM_PROMPT_GUIDED) // 4} tokens")
    print()
    print("--- SIMPLE ---")
    print(ARC_SYSTEM_PROMPT_SIMPLE)
    print()
    print("--- GUIDED ---")
    print(ARC_SYSTEM_PROMPT_GUIDED)
+ +import json +from pathlib import Path + +ARC_PROBLEMS = Path(__file__).parent / "arc" / "arc_problems.json" +PROBLEMS_DIR = Path(__file__).parent / "problems" + + +def main(): + with open(ARC_PROBLEMS) as f: + problems = json.load(f) + + print(f"Read {len(problems)} ARC problems from {ARC_PROBLEMS}") + + PROBLEMS_DIR.mkdir(exist_ok=True) + + written = 0 + for p in problems: + pid = p["problem_id"] + out = { + "problem_id": pid, + "problem_text": p["problem_text"], + "ground_truth": p["ground_truth"], + "topic": "arc", + "source": "ARC1-Eval", + } + outpath = PROBLEMS_DIR / f"{pid}.json" + outpath.write_text(json.dumps(out, indent=2)) + written += 1 + print(f" Wrote {outpath.name}") + + print(f"\nDone: {written} ARC problem files written to {PROBLEMS_DIR}") + print(f"Total files in problems/: {len(list(PROBLEMS_DIR.glob('*.json')))}") + + +if __name__ == "__main__": + main() diff --git a/models.json b/models.json new file mode 100644 index 0000000..56ceb12 --- /dev/null +++ b/models.json @@ -0,0 +1,13 @@ +[ + {"name": "qwen/qwen3.6-plus-preview", "url": "openrouter://qwen/qwen3.6-plus-preview:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "nvidia/nemotron-3-super-120b", "url": "openrouter://nvidia/nemotron-3-super-120b-a12b:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "z-ai/glm-4.5-air", "url": "openrouter://z-ai/glm-4.5-air:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "arcee-ai/trinity-large-preview", "url": "openrouter://arcee-ai/trinity-large-preview:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "qwen/qwen3-coder", "url": "openrouter://qwen/qwen3-coder:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "stepfun/step-3.5-flash", "url": "openrouter://stepfun/step-3.5-flash:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "minimax/minimax-m2.5", "url": "openrouter://minimax/minimax-m2.5:free", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "gemini-3.1-flash-lite-preview", "url": 
"gemini://gemini-3.1-flash-lite-preview", "api_key_env": "GEMINI_API_KEY"}, + {"name": "mistral-small-2603", "url": "openrouter://mistralai/mistral-small-2603", "api_key_env": "OPENROUTER_API_KEY"}, + {"name": "claude-sonnet-4.6", "url": "anthropic://claude-sonnet-4-6", "api_key_env": "ANTHROPIC_OAUTHTOKEN"}, + {"name": "deepseek-v3.2", "url": "openrouter://deepseek/deepseek-chat-v3-0324", "api_key_env": "OPENROUTER_API_KEY"} +] diff --git a/problems/aimo3_hard_00eaa992.json b/problems/aimo3_hard_00eaa992.json new file mode 100644 index 0000000..6e1cbeb --- /dev/null +++ b/problems/aimo3_hard_00eaa992.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_00eaa992", + "problem_text": "If \\((60-a)(60-b)(60-c)(60-d)(60-e) = 1025\\), what is the value of \\(a + b + c + d\\)?\n\nNote: 1025 is divisible by 5.", + "ground_truth": "188", + "topic": "number_theory", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_2e0b7ba3.json b/problems/aimo3_hard_2e0b7ba3.json new file mode 100644 index 0000000..faa1763 --- /dev/null +++ b/problems/aimo3_hard_2e0b7ba3.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_2e0b7ba3", + "problem_text": "How many ways are there to paint the first level of the Th\u00e1p R\u00f9a tower model, given that the $3$ doorways at the front are painted with the same color and each of the remaining $7$ doorways is painted with one of the three colors such that any two adjacent doorways with a common side on the same level are painted with different colors?", + "ground_truth": "216", + "topic": "combinatorics", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_5f9595ae.json b/problems/aimo3_hard_5f9595ae.json new file mode 100644 index 0000000..973d181 --- /dev/null +++ 
b/problems/aimo3_hard_5f9595ae.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_5f9595ae", + "problem_text": "In an acute triangle \\(ABC\\) with \\(\\angle A = 30^\\circ\\), a circle with diameter \\(BC\\) intersects \\(AB\\) and \\(AC\\) at points \\(D\\) and \\(E\\), respectively. Find the ratio of the area of \\(\\triangle ADC\\) to the area of quadrilateral \\(DBCE\\).", + "ground_truth": "3", + "topic": "geometry", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_858cba58.json b/problems/aimo3_hard_858cba58.json new file mode 100644 index 0000000..9c7bd09 --- /dev/null +++ b/problems/aimo3_hard_858cba58.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_858cba58", + "problem_text": "All vertices of a pyramid lie on the facets of a cube but not on its edges, and each facet contains at least one vertex. What is the maximum possible number of the vertices of the pyramid?", + "ground_truth": "13", + "topic": "other", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_b0dc264b.json b/problems/aimo3_hard_b0dc264b.json new file mode 100644 index 0000000..22a7c54 --- /dev/null +++ b/problems/aimo3_hard_b0dc264b.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_b0dc264b", + "problem_text": "Given the group $(G, *)$ with $G = \\{a, b, c, d, f, g, h, k\\}$ and identity $k$, and the following operations:\n- $a * b = c$\n- $b * a = d$\n- $f * f = a$\n- $g * g = b$\n- $h * h = c$\n\nHow many self-inverses does $(G, *)$ have?", + "ground_truth": "2", + "topic": "other", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_b1da52fa.json 
b/problems/aimo3_hard_b1da52fa.json new file mode 100644 index 0000000..2f7683a --- /dev/null +++ b/problems/aimo3_hard_b1da52fa.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_b1da52fa", + "problem_text": "Drunk and Horse play a game on a $2023! \\times 2023!$ grid. Horse chooses a positive integer $k < 2023$ and lights up each square using $k$ different colors. Horse starts on a random square, and Drunk starts on another square exactly $2023^2$ squares away in one direction. In each turn, Drunk moves one square in some direction but cannot move in the same direction for 2023 consecutive moves. Horse moves up to $m$ squares in a direction of its choice, where $m = 2023 - k$. Horse gets alerted of the color of the square Drunk was previously on. Horse wins if it ends up on a square that shares at least one vertex with Drunk's square. What is the minimum number of turns in which Horse can guarantee a win?", + "ground_truth": "2030", + "topic": "combinatorics", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/aimo3_hard_f728b4b1.json b/problems/aimo3_hard_f728b4b1.json new file mode 100644 index 0000000..25e7e94 --- /dev/null +++ b/problems/aimo3_hard_f728b4b1.json @@ -0,0 +1,10 @@ +{ + "problem_id": "aimo3_hard_f728b4b1", + "problem_text": "Triangle $ABC$ is constructed such that $AB>BC>AC$. Points $E$, $F$, and $G$ are drawn from $A$, $B$, and $C$ to their opposite sides respectively. If $\\frac{BE}{EC} = \\frac{7}{12}$, the ratio of $\\frac{AF}{FC}$ can be represented as $\\frac{m}{n}$, where $m$ and $n$ are relatively prime positive integers. 
What is the smallest possible sum of $m+n$?", + "ground_truth": "26", + "topic": "geometry", + "source": "aimo3_hard", + "gptoss_20b_pass_rate": 0.125, + "gptoss_20b_n_correct": 2, + "gptoss_20b_correct_token_avg": null +} \ No newline at end of file diff --git a/problems/arc1_50f325b5.json b/problems/arc1_50f325b5.json new file mode 100644 index 0000000..2443ecd --- /dev/null +++ b/problems/arc1_50f325b5.json @@ -0,0 +1,314 @@ +{ + "problem_id": "arc1_50f325b5", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n2 2 0 7 0 3 2 7 0 2 7 0 3 2 7 0 0 3\n2 2 0 0 2 3 3 4 0 0 7 0 0 0 0 0 0 7\n4 2 7 2 7 0 4 0 0 7 2 0 3 0 7 3 2 0\n3 7 2 2 7 0 0 3 0 2 4 0 2 4 0 4 3 3\n2 4 3 2 0 4 3 2 3 2 0 0 8 8 8 7 0 2\n2 7 3 2 7 0 0 2 3 3 3 7 0 8 2 2 2 0\n0 2 2 2 0 3 2 7 3 3 7 0 0 8 0 0 0 0\n4 2 7 3 0 3 0 7 2 7 2 0 4 2 7 7 0 0\n0 0 2 0 2 0 4 7 4 0 0 2 2 2 3 3 3 0\n2 0 4 7 0 7 0 3 2 4 2 0 0 2 0 0 2 7\n7 4 2 7 4 3 3 7 2 2 0 0 7 7 0 7 0 4\n\nOutput:\n2 2 0 7 0 3 2 7 0 2 7 0 3 2 7 0 0 3\n2 2 0 0 2 3 3 4 0 0 7 0 0 0 0 0 0 7\n4 2 7 2 7 0 4 0 0 7 2 0 3 0 7 3 2 0\n3 7 2 2 7 0 0 3 0 2 4 0 2 4 0 4 3 3\n2 4 3 2 0 4 3 2 8 2 0 0 8 8 8 7 0 2\n2 7 3 2 7 0 0 2 8 8 8 7 0 8 2 2 2 0\n0 2 2 2 0 3 2 7 8 3 7 0 0 8 0 0 0 0\n4 2 7 3 0 3 0 7 2 7 2 0 4 2 7 7 0 0\n0 0 2 0 2 0 4 7 4 0 0 2 2 2 3 3 3 0\n2 0 4 7 0 7 0 3 2 4 2 0 0 2 0 0 2 7\n7 4 2 7 4 3 3 7 2 2 0 0 7 7 0 7 0 4\n\nTraining Example 2:\nInput:\n2 7 7 0 0 3 3 2 2 0 0 2 3 3 7 0 0\n0 3 7 2 2 4 2 7 4 2 7 2 2 7 0 7 2\n2 3 0 3 7 3 0 2 7 2 0 2 2 3 2 3 2\n2 4 7 3 0 0 4 2 4 2 4 0 7 0 3 3 0\n7 3 2 4 3 2 0 0 7 2 0 3 2 2 3 0 2\n2 7 3 7 2 2 2 0 2 2 7 4 2 2 3 0 3\n0 3 0 0 2 3 0 2 2 0 7 7 3 2 0 0 0\n2 0 0 4 0 2 2 2 0 4 4 0 7 0 0 3 2\n3 2 7 0 7 8 0 8 0 4 2 2 2 2 0 0 0\n7 2 3 4 3 2 8 8 2 0 4 0 3 7 0 3 2\n7 7 2 2 0 7 7 4 2 3 2 7 2 2 7 2 3\n0 0 0 4 2 3 0 4 7 7 3 0 7 2 0 3 0\n0 0 7 2 3 0 2 3 0 3 4 2 3 3 3 2 3\n7 2 2 2 2 3 0 3 0 3 3 0 7 0 3 3 2\n\nOutput:\n2 7 7 0 0 3 3 2 2 0 0 2 3 3 7 0 0\n0 3 7 2 2 4 2 7 4 2 7 2 2 7 0 7 2\n2 3 0 3 7 3 
0 2 7 2 0 2 2 8 2 8 2\n2 4 7 3 0 0 4 2 4 2 4 0 7 0 8 8 0\n7 3 2 4 3 2 0 0 7 2 0 3 2 2 3 0 2\n2 7 3 7 2 2 2 0 2 2 7 4 2 2 3 0 3\n0 3 0 0 2 3 0 2 2 0 7 7 3 2 0 0 0\n2 0 0 4 0 2 2 2 0 4 4 0 7 0 0 3 2\n3 2 7 0 7 8 0 8 0 4 2 2 2 2 0 0 0\n7 2 3 4 3 2 8 8 2 0 4 0 3 7 0 3 2\n7 7 2 2 0 7 7 4 2 3 2 7 2 2 7 2 3\n0 0 0 4 2 3 0 4 7 7 8 0 7 2 0 8 0\n0 0 7 2 3 0 2 3 0 8 4 2 3 3 8 2 3\n7 2 2 2 2 3 0 3 0 8 8 0 7 0 8 8 2\n\nTraining Example 3:\nInput:\n3 0 0 7 3 3 3 2 2 3 3 2 0 2 4 7 2 0\n0 2 4 0 2 0 7 0 0 2 0 3 2 2 2 2 2 7\n7 0 2 3 0 4 4 7 2 7 7 0 4 0 4 3 0 3\n7 3 0 2 4 3 7 2 0 2 0 3 3 2 2 7 4 0\n0 3 4 3 2 4 3 8 0 2 3 3 4 0 3 0 3 0\n0 2 2 0 7 3 8 8 8 4 3 0 7 3 4 2 2 2\n2 3 2 4 7 0 7 2 0 4 0 0 0 0 7 0 4 7\n3 4 7 7 0 3 2 0 0 7 3 0 2 7 4 2 0 3\n2 3 0 3 3 0 0 2 2 0 7 7 3 0 2 2 2 3\n0 3 3 4 0 3 0 0 2 7 3 0 0 0 2 3 7 3\n0 3 4 3 0 7 2 0 3 0 3 3 0 4 0 2 3 3\n3 2 0 4 0 2 7 3 7 0 3 3 2 0 0 2 2 7\n2 2 3 3 4 3 7 7 2 2 4 0 0 0 4 2 3 2\n0 2 0 2 0 0 4 0 0 3 7 0 0 0 4 3 4 2\n0 4 3 0 0 3 0 0 7 0 0 0 2 3 3 7 4 3\n\nOutput:\n3 0 0 7 3 3 3 2 2 3 3 2 0 2 4 7 2 0\n0 2 4 0 2 0 7 0 0 2 0 3 2 2 2 2 2 7\n7 0 2 3 0 4 4 7 2 7 7 0 4 0 4 3 0 3\n7 3 0 2 4 3 7 2 0 2 0 3 3 2 2 7 4 0\n0 3 4 3 2 4 3 8 0 2 3 3 4 0 3 0 3 0\n0 2 2 0 7 3 8 8 8 4 3 0 7 3 4 2 2 2\n2 3 2 4 7 0 7 2 0 4 0 0 0 0 7 0 4 7\n3 4 7 7 0 3 2 0 0 7 3 0 2 7 4 2 0 3\n2 8 0 3 3 0 0 2 2 0 7 7 3 0 2 2 2 3\n0 8 8 4 0 3 0 0 2 7 8 0 0 0 2 3 7 3\n0 8 4 3 0 7 2 0 3 0 8 8 0 4 0 2 3 3\n3 2 0 4 0 2 7 3 7 0 8 3 2 0 0 2 2 7\n2 2 3 3 4 3 7 7 2 2 4 0 0 0 4 2 3 2\n0 2 0 2 0 0 4 0 0 3 7 0 0 0 4 3 4 2\n0 4 3 0 0 3 0 0 7 0 0 0 2 3 3 7 4 3\n\nTraining Example 4:\nInput:\n2 3 2 8 4 4 0 2 3 0 2 4 7 7 3 7 3\n3 4 8 8 8 0 0 2 0 2 0 2 7 7 7 3 7\n7 3 0 8 0 2 2 0 2 2 0 7 3 0 3 3 3\n2 0 2 0 2 0 3 2 0 7 0 7 0 0 2 3 0\n7 7 4 3 7 2 0 2 3 0 3 4 7 2 0 3 7\n2 4 0 7 0 0 3 4 4 0 3 4 4 3 3 4 0\n3 2 7 3 7 3 7 2 0 2 3 2 3 3 3 4 4\n3 7 4 0 2 0 2 0 3 7 2 3 3 3 3 0 2\n3 2 3 2 0 2 0 2 0 7 2 0 2 4 4 7 3\n4 3 4 2 0 7 0 0 7 0 0 0 0 3 0 0 3\n2 3 0 0 4 0 2 0 3 3 2 0 4 0 0 2 2\n3 3 4 3 2 7 2 4 3 0 7 3 
3 4 2 0 3\n2 0 7 7 0 3 7 4 3 7 0 2 0 3 7 0 2\n2 3 0 0 2 3 0 7 0 7 3 7 0 4 0 3 7\n2 0 2 2 7 2 0 0 2 2 3 0 0 3 7 0 3\n7 2 4 0 3 0 0 2 2 7 4 0 0 2 2 0 4\n0 0 3 0 4 4 7 7 4 2 0 0 3 7 0 2 0\n2 3 4 0 3 0 3 3 2 3 4 7 7 0 2 0 3\n\nOutput:\n2 3 2 8 4 4 0 2 3 0 2 4 7 7 3 7 3\n3 4 8 8 8 0 0 2 0 2 0 2 7 7 7 8 7\n7 3 0 8 0 2 2 0 2 2 0 7 3 0 8 8 8\n2 0 2 0 2 0 3 2 0 7 0 7 0 0 2 8 0\n7 7 4 3 7 2 0 2 3 0 3 4 7 2 0 3 7\n2 4 0 7 0 0 3 4 4 0 3 4 4 8 3 4 0\n3 2 7 3 7 3 7 2 0 2 3 2 8 8 8 4 4\n3 7 4 0 2 0 2 0 3 7 2 3 3 8 3 0 2\n3 2 3 2 0 2 0 2 0 7 2 0 2 4 4 7 3\n4 3 4 2 0 7 0 0 7 0 0 0 0 3 0 0 3\n2 3 0 0 4 0 2 0 3 3 2 0 4 0 0 2 2\n3 3 4 3 2 7 2 4 3 0 7 3 3 4 2 0 3\n2 0 7 7 0 3 7 4 3 7 0 2 0 3 7 0 2\n2 3 0 0 2 3 0 7 0 7 3 7 0 4 0 3 7\n2 0 2 2 7 2 0 0 2 2 3 0 0 3 7 0 3\n7 2 4 0 3 0 0 2 2 7 4 0 0 2 2 0 4\n0 0 3 0 4 4 7 7 4 2 0 0 3 7 0 2 0\n2 3 4 0 3 0 3 3 2 3 4 7 7 0 2 0 3\n\nTest Input:\n7 3 2 2 4 3 7 2 7 0 7 3 4 0 3 2 4\n0 2 2 2 2 3 0 3 3 0 3 2 0 0 3 0 7\n3 2 0 3 7 0 2 2 2 3 7 0 3 3 0 2 2\n4 2 7 7 0 0 2 0 0 0 7 4 3 2 3 7 2\n7 0 8 3 0 7 3 3 0 2 3 0 4 0 0 7 0\n3 4 8 8 3 2 0 0 3 4 2 4 0 3 3 2 4\n2 3 0 8 0 0 2 4 0 4 4 0 0 7 2 3 0\n2 4 0 3 0 0 2 2 3 2 7 3 3 7 0 4 0\n2 7 7 4 0 3 0 2 7 7 0 4 7 0 7 3 3\n0 0 7 3 4 0 2 3 0 7 4 3 2 3 0 7 3\n2 7 0 3 4 7 3 4 0 4 0 0 0 3 3 7 2\n4 3 0 2 3 0 4 0 4 3 3 2 2 3 3 0 3\n4 7 0 7 3 3 2 3 3 0 7 0 0 0 0 4 7\n3 3 3 3 0 4 3 4 4 7 3 7 0 0 0 3 0\n0 2 2 3 3 3 0 7 3 2 7 3 4 3 3 3 3\n3 3 3 4 7 4 3 3 3 0 0 4 0 7 0 4 3\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 7, + 3, + 2, + 2, + 4, + 3, + 7, + 2, + 7, + 0, + 7, + 3, + 4, + 0, + 3, + 2, + 4 + ], + [ + 0, + 2, + 2, + 2, + 2, + 3, + 0, + 3, + 3, + 0, + 3, + 2, + 0, + 0, + 3, + 0, + 7 + ], + [ + 3, + 2, + 0, + 3, + 7, + 0, + 2, + 2, + 2, + 3, + 7, + 0, + 3, + 3, + 0, + 2, + 2 + ], + [ + 4, + 2, + 7, + 7, + 0, + 0, + 2, + 0, + 0, + 0, + 7, + 4, + 3, + 2, + 3, + 7, + 2 + ], + [ + 7, + 0, + 8, + 3, + 0, + 7, + 3, + 3, + 0, + 2, + 3, + 0, + 4, + 0, + 0, + 7, + 0 + ], + [ + 3, + 4, + 8, + 8, + 3, + 2, + 0, + 0, + 3, + 4, + 2, + 4, + 0, + 3, + 3, + 2, + 4 + ], + [ + 2, + 3, + 0, + 8, + 0, + 0, + 2, + 4, + 0, + 4, + 4, + 0, + 0, + 7, + 2, + 3, + 0 + ], + [ + 2, + 4, + 0, + 3, + 0, + 0, + 2, + 2, + 3, + 2, + 7, + 3, + 3, + 7, + 0, + 4, + 0 + ], + [ + 2, + 7, + 7, + 4, + 0, + 3, + 0, + 2, + 7, + 7, + 0, + 4, + 7, + 0, + 7, + 3, + 3 + ], + [ + 0, + 0, + 7, + 3, + 4, + 0, + 2, + 3, + 0, + 7, + 4, + 3, + 2, + 8, + 0, + 7, + 3 + ], + [ + 2, + 7, + 0, + 3, + 4, + 7, + 3, + 4, + 0, + 4, + 0, + 0, + 0, + 8, + 8, + 7, + 2 + ], + [ + 4, + 3, + 0, + 2, + 3, + 0, + 4, + 0, + 4, + 3, + 3, + 2, + 2, + 3, + 8, + 0, + 3 + ], + [ + 4, + 7, + 0, + 7, + 3, + 3, + 2, + 3, + 3, + 0, + 7, + 0, + 0, + 0, + 0, + 4, + 7 + ], + [ + 3, + 3, + 8, + 8, + 0, + 4, + 3, + 4, + 4, + 7, + 3, + 7, + 0, + 0, + 0, + 8, + 0 + ], + [ + 0, + 2, + 2, + 8, + 8, + 3, + 0, + 7, + 3, + 2, + 7, + 3, + 4, + 3, + 3, + 8, + 8 + ], + [ + 3, + 3, + 3, + 4, + 7, + 4, + 3, + 3, + 3, + 0, + 0, + 4, + 0, + 7, + 0, + 4, + 8 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_13e47133.json b/problems/arc2_13e47133.json new file mode 100644 index 0000000..0308a4d --- /dev/null +++ b/problems/arc2_13e47133.json @@ -0,0 +1,1932 @@ +{ + "problem_id": "arc2_13e47133", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 1 1 1 1 1 1 1 2 1 
1 1 1 1 1 1 1 1 1 8\n1 8 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 4 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 3 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 2 1 1 1\n1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n7 7 7 7 7 7 7 7 2 8 8 8 8 8 8 8 8 8 8 8\n7 8 8 8 8 8 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 7 7 7 7 8 7 2 8 4 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 4 4 4 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 8 8 8 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 4 4 4 4 4 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 7 8 8 7 8 7 2 8 8 8 8 8 8 8 8 8 4 8\n7 8 7 8 8 7 8 7 2 2 2 2 2 2 2 2 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 3 3 3 3 3 3 3 2 8 4 8\n7 8 7 8 8 7 8 7 2 2 2 2 2 2 2 2 2 8 4 8\n7 8 7 8 8 7 8 7 2 8 8 8 8 8 8 8 8 8 4 8\n7 8 7 7 7 7 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 8 8 8 8 8 8 7 2 8 4 4 4 4 4 4 4 4 4 8\n7 7 7 7 7 7 7 7 2 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n4 4 4 4 4 4 4 4 4 4 2 8 4 4 4 4 4 4 4 4\n4 3 4 4 4 4 4 4 4 4 2 4 1 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 
4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 2 2 2 2 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 2 5 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 0 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 1 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4\n\nOutput:\n4 4 4 4 4 4 4 4 4 4 2 8 8 8 8 8 8 8 8 8\n4 3 3 3 3 3 3 3 3 4 2 8 1 1 1 1 1 1 1 8\n4 3 4 4 4 4 4 4 3 4 2 8 1 8 8 8 8 8 1 8\n4 3 4 3 3 3 3 4 3 4 2 8 1 8 1 1 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 8 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 1 1 1 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 8 8 8 8 8 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 1 1 1 1 1 1 1 8\n4 3 4 3 4 4 3 4 3 4 2 8 8 8 8 8 8 8 8 8\n4 3 4 3 4 4 3 4 3 4 2 2 2 2 2 2 2 2 2 2\n4 3 4 3 4 4 3 4 3 4 2 5 5 5 5 5 5 5 5 5\n4 3 4 3 4 4 3 4 3 4 2 5 0 0 0 0 0 0 0 5\n4 3 4 3 4 4 3 4 3 4 2 5 0 1 1 1 1 1 0 5\n4 3 4 3 3 3 3 4 3 4 2 5 0 1 5 5 5 1 0 5\n4 3 4 4 4 4 4 4 3 4 2 5 0 1 1 1 1 1 0 5\n4 3 3 3 3 3 3 3 3 4 2 5 0 0 0 0 0 0 0 5\n4 4 4 4 4 4 4 4 4 4 2 5 5 5 5 5 5 5 5 5\n\nTraining Example 3:\nInput:\n9 8 8 8 8 8 6 8 8 8 8 8 7\n8 1 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 6 6 6 6 6 6\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n8 8 8 8 8 8 6 8 8 8 8 8 8\n\nOutput:\n9 9 9 9 9 9 6 7 7 7 7 7 7\n9 1 1 1 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 7 7 7 7 7 7\n9 1 9 9 1 9 6 6 6 6 6 6 6\n9 1 9 9 1 9 6 8 8 8 8 8 8\n9 1 1 1 1 9 6 8 8 8 8 8 8\n9 9 9 9 9 9 6 8 8 8 8 8 8\n\nTest Input 1:\n1 3 3 3 3 3 3 3 3 3 3 8 6 3 3 3 3 3 3 3 8 2 3 3 3 3 3 3 3 3\n3 2 3 3 3 3 3 3 3 3 3 8 3 
4 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 5 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 4 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 1 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 4 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3 3 3 8 3 3 3 3 3 3 3 3 3 3\n\nTest Input 2:\n8 8 8 8 8 8 4 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 4 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n8 8 8 8 8 8 6 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 5 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 4 8 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 7 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 2 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 1 1 1 1 1 1 1 1 1 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 4 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 1 1 1 1 1 1 1 1\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 8, + 6, + 4, + 4, + 4, + 4, 
+ 4, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 2, + 2, + 2, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 1, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 4, + 4, + 4, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 6, + 6, + 6, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 4, + 4, + 4, + 4, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 1, + 1, + 4, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 4, + 1, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 4, + 1, + 4, + 8, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 1, + 1, + 1, + 4, + 8, + 6, + 4, + 4, + 4, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 4, + 4, + 4, + 4, + 4, + 8, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, 
+ 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 1, + 1, + 1, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 2, + 2, + 2, + 2, + 2, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 8, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 5, + 6, + 4, + 4, + 6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 6, + 4, + 5, + 6, + 6, + 6, + 
6, + 5, + 4, + 6 + ], + [ + 1, + 2, + 1, + 1, + 2, + 1, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 8, + 6, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6 + ], + [ + 1, + 2, + 2, + 2, + 2, + 1, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 8, + 6, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 6 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 1, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2 + ], + [ + 4, + 3, + 4, + 4, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 3, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 3, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 3, + 2 + ], + [ + 4, + 3, + 4, + 4, + 4, + 3, + 4, + 1, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2 + ], + [ + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 1, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 2, + 2, + 2, + 2, + 2, + 2, 
+ 2, + 2, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 6, + 1, + 2, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4 + ], + [ + 6, + 5, + 4, + 4, + 4, + 5, + 6, + 1, + 2, + 7, + 2, + 2, + 2, + 2, + 7, + 2, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 7, + 2, + 2, + 2, + 2, + 7, + 2, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4 + ], + [ + 6, + 5, + 4, 
+ 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 4, + 2, + 9, + 4, + 2, + 9, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 2, + 2, + 2, + 9, + 4, + 2, + 9, + 4, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 4, + 2, + 9, + 4, + 1, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 9 + ], + [ + 6, + 5, + 4, + 6, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 9, + 4, + 1, + 9, + 2, + 9, + 9, + 9, + 9, + 2, + 9 + ], + [ + 6, + 5, + 4, + 4, + 4, + 5, + 6, + 1, + 4, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 9, + 4, + 1, + 9, + 2, + 9, + 9, + 9, + 9, + 2, + 9 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 6, + 1, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 1, + 9, + 2, + 2, + 2, + 2, + 2, + 2, + 9 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_21897d95.json b/problems/arc2_21897d95.json new file mode 100644 index 0000000..c2ac06f --- /dev/null +++ b/problems/arc2_21897d95.json @@ -0,0 +1,1596 @@ +{ + "problem_id": "arc2_21897d95", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n6 6 6 6 6 7 7 7 4 4 4 4\n6 6 6 6 6 7 7 7 4 4 4 4\n6 6 6 1 6 7 7 7 4 4 4 4\n6 6 6 3 1 7 7 7 4 9 9 9\n6 6 6 1 6 7 7 7 4 4 4 9\n6 6 6 6 6 7 7 7 4 4 4 9\n6 6 6 6 6 7 1 7 4 4 4 4\n6 6 6 6 6 7 1 1 4 4 4 4\n6 6 6 6 6 7 1 7 4 4 4 4\n6 6 6 6 6 7 7 7 4 4 4 4\n7 7 1 7 7 7 7 7 7 7 7 7\n7 1 0 1 7 7 7 7 7 1 1 1\n7 7 7 7 7 7 7 7 7 7 1 7\n8 8 8 8 8 8 
8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n7 7 7 7 7 7 7 7 7 7 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n3 3 3 3 3 3 3 3 3 3 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n0 0 0 0 0 0 0 0 0 0 3 3 3 7 7 7\n\nTraining Example 2:\nInput:\n7 7 7 7 7 7 1 7 3 3\n7 7 7 7 7 7 1 1 3 3\n7 7 7 7 7 7 1 7 3 3\n8 8 8 3 1 7 7 7 3 1\n8 8 8 1 1 7 7 7 1 6\n8 1 8 3 1 7 7 7 3 1\n8 1 1 3 3 1 9 1 3 3\n8 1 8 3 3 7 1 7 3 3\n8 8 8 3 3 5 5 5 3 3\n8 8 8 3 3 5 5 5 3 3\n\nOutput:\n6 6 6 6 6 6 6 6 7 7\n6 6 6 6 6 6 6 6 7 7\n6 6 6 6 6 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 6 6 6 7 7\n3 3 3 8 8 9 9 9 7 7\n3 3 3 8 8 9 9 9 7 7\n\nTraining Example 3:\nInput:\n6 6 6 3 1 3 3 3 3\n6 6 6 1 1 3 3 3 3\n6 6 6 3 1 3 3 3 3\n6 6 6 4 4 4 4 1 4\n6 6 6 4 4 4 1 1 1\n6 6 6 4 4 4 4 4 4\n6 6 6 6 1 6 4 4 4\n6 6 6 6 1 1 4 4 4\n6 6 6 6 1 6 4 4 4\n5 5 5 4 4 4 4 4 4\n9 9 9 8 8 8 8 8 8\n9 5 5 8 8 8 1 7 1\n9 5 5 8 8 8 8 1 8\n5 5 5 4 4 4 4 4 4\n\nOutput:\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n5 5 5 5 5 3 3 3 3 3 3 3 3 3\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 3 3 3 6 6 6 4 4 4\n7 8 8 8 6 6 6 6 6 6 6 4 4 4\n7 8 8 8 6 6 6 6 6 6 6 4 4 4\n7 8 8 8 6 6 6 6 6 6 6 4 4 4\n\nTraining Example 4:\nInput:\n2 2 2 2 2 1 2 3 3 3\n2 2 2 2 2 1 1 3 3 3\n2 2 2 2 2 1 2 3 3 3\n6 6 6 6 1 6 6 3 1 3\n6 6 6 1 1 1 6 1 1 3\n1 1 1 6 6 6 6 3 1 3\n6 1 6 6 6 6 6 3 3 3\n4 4 4 4 4 4 4 3 3 3\n4 4 4 4 4 4 4 3 3 3\n4 4 4 4 4 4 4 3 3 3\n\nOutput:\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n3 3 3 3 3 3 3 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n6 6 6 6 6 6 6 2 2 2\n\nTest Input 1:\n9 9 9 9 9 9 9 9 9 9 
9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 7 7 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 3 3 3 1 3 3 3 3 3 3 9 9 9 7 7 7 7 9 9\n9 9 9 9 3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 3 3 9 9 9 7 7 7 7 9 9\n9 9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 7 7 7 7 9 9\n9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 9 1 9 9 9 9\n9 9 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 9 9 1 1 1 9 9 4\n9 3 3 3 3 0 1 0 0 0 0 0 0 0 0 0 3 3 3 3 3 3 9 9 9 9 9 9 4 4\n9 3 3 3 0 1 8 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 9 9 9 9 9 4 4 4\n9 3 3 0 0 0 0 0 0 0 0 0 0 2 1 2 2 0 0 0 0 0 9 9 9 9 9 4 4 4\n9 3 3 0 0 0 0 0 0 0 2 2 2 1 1 1 2 2 2 2 0 0 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 0 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 9 9 4 4 4 4\n9 3 3 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 6 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 2 2 2 9 9 4 4 4 4 4\n6 6 6 6 0 0 1 1 1 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 0 1 0 0 0 0 0 0 2 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 0 0 2 2 2 2 2 2 2 2 2 2 9 4 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 6 2 2 2 2 2 2 2 2 2 2 9 9 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 1 2 2 2 2 2 2 2 2 2 9 9 9 4 4 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 1 6 9 2 2 2 2 2 2 2 2 9 9 9 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 9 2 2 2 2 2 2 2 9 9 9 8 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 6 6 9 9 9 2 2 2 2 9 9 9 9 8 8 8 8 4 4\n6 6 6 6 6 6 6 6 6 6 6 9 9 9 9 9 9 9 9 9 9 9 8 8 8 8 8 8 1 8\n6 6 6 6 6 9 9 9 9 9 9 9 9 9 9 9 8 8 8 8 8 8 8 8 8 8 8 1 1 1\n9 9 9 9 9 9 9 9 9 9 9 9 1 9 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n9 9 9 9 9 9 9 9 9 9 9 9 0 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n9 9 9 9 9 9 9 9 9 9 9 9 1 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 2:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 1 1 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 
5 5 5 5 5 5 5 5 1 5 5\n3 3 1 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 1 1 1 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 9 9 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 9 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 1 7 1 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 8 8 1 8 8 8 8 8 8 8 8 8 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 4 1 4 4 4 4 4 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 1 1 1 4 4 4 4 6 6 6 6 6 6\n3 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 6 6 1 1 1 6\n3 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 6 6 6 1 6 6\n2 2 1 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 1 1 1 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 3, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8 + ], + [ + 3, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 2, + 2, + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 2, + 2, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 2, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 3, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, 
+ 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 0, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 
5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 
4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 6, + 6, + 6, + 6 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_269e22fb.json b/problems/arc2_269e22fb.json new file mode 100644 index 0000000..c0d3ec4 --- /dev/null +++ b/problems/arc2_269e22fb.json @@ -0,0 +1,892 @@ +{ + "problem_id": "arc2_269e22fb", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 7 8 8 8 8 8 8 8 8\n7 7 7 7 7 7 8 8 8 8\n7 7 7 7 7 7 7 8 8 8\n7 7 8 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 8\n8 8 8 8 8 8 8 7 7 7\n8 8 8 8 8 8 8 8 7 7\n8 8 8 8 8 8 8 8 8 7\n\nOutput:\n7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7 8 8 8\n7 7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 7 8 8 8\n7 7 7 7 7 7 7 8 8 8 8 8 8 8 8 7 7 7 8 8\n7 7 8 8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 8 8 8 8 8 7 7 7 7 7 8\n8 8 8 8 8 8 8 7 7 7 8 8 8 8 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 7 7 8 8 7 7 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 8 7 8 8 7 8 7 8 8 7 7 8\n8 8 8 8 8 8 8 8 8 7 7 7 7 8 7 8 8 7 7 8\n8 7 7 7 7 7 7 7 7 7 8 7 7 8 7 8 8 7 7 8\n8 7 8 
8 8 8 8 8 8 7 7 7 7 8 7 8 8 7 7 8\n8 7 7 7 7 7 7 7 7 7 8 8 7 8 7 8 8 7 7 8\n8 7 8 7 8 8 8 8 8 7 8 8 7 7 7 8 8 7 7 8\n7 7 7 8 7 7 7 7 7 7 8 8 8 8 7 8 8 7 7 8\n8 7 8 7 7 8 8 8 8 7 8 8 8 8 7 7 7 7 7 8\n7 7 7 8 7 8 8 8 8 7 8 8 8 7 7 8 7 7 8 8\n8 7 8 7 7 8 8 8 8 7 8 8 8 7 8 8 8 7 7 8\n7 7 7 8 7 8 8 8 8 7 8 8 8 7 7 8 8 8 7 7\n8 7 8 7 7 8 8 8 7 8 7 8 8 8 7 8 7 7 7 8\n7 7 7 8 8 8 8 7 8 8 8 7 8 8 7 7 7 8 8 8\n\nTraining Example 2:\nInput:\n8 8 7 8 8 8 7 8\n8 8 8 7 8 7 8 8\n7 8 8 8 7 8 8 8\n7 8 8 8 7 8 8 8\n7 8 8 8 7 8 8 8\n8 8 8 8 7 8 8 8\n8 8 8 8 7 7 7 7\n7 7 8 8 7 8 8 8\n8 7 8 8 7 7 7 7\n8 7 7 7 7 8 8 8\n8 7 7 8 7 7 7 7\n8 7 7 7 7 8 8 8\n8 7 8 8 7 8 8 8\n7 7 8 8 7 7 8 8\n8 8 8 8 7 7 7 8\n8 8 8 8 8 7 7 7\n\nOutput:\n8 8 8 7 7 7 8 8 7 8 8 8 7 8 8 8 8 7 7 7\n8 7 7 7 8 7 8 8 8 7 8 7 8 8 8 7 7 8 7 8\n7 7 8 8 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 8 8 8 7 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 8 7 7 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 7 7 7 8 7 7 7\n8 7 7 8 8 7 7 7 8 8 7 8 8 8 8 8 7 8 7 8\n8 7 7 8 8 7 8 7 8 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 7 8\n8 7 7 8 8 7 8 7 7 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 8 8 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 7 7 8 8 7 7 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 7 7 7 8 8 8 8 8 7 7 7 8 8 8 8 8 8\n8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8 8 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 8 7 7 7 7 7 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 7 7 7 7 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 3 3 3 3 3\n0 0 3 3 3 3 3 3 3 3\n3 3 3 3 3 0 0 0 0 0\n3 3 3 3 3 0 0 0 0 0\n0 0 0 0 3 3 3 3 3 3\n0 0 0 0 0 0 3 0 0 0\n0 0 0 0 0 0 3 3 3 3\n0 0 0 0 0 0 0 0 3 3\n0 0 0 0 0 0 0 0 3 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 0 0\n0 0 0 0 3 3 3 3 3 3 3 3 3 3 3 0 3 3 3 0\n0 0 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 0 3 0\n3 3 3 3 3 0 0 0 0 0 0 0 0 0 3 3 0 0 3 3\n3 3 3 3 3 0 0 0 0 0 0 0 0 0 3 0 0 0 0 3\n0 0 
0 0 3 3 3 3 3 3 3 3 3 3 3 3 0 3 3 3\n0 0 0 0 0 0 3 0 0 0 0 0 3 0 0 3 3 3 0 0\n0 0 0 0 0 0 3 3 3 3 3 3 3 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 3 3 3 0 0 0 0 0 0 0 0 3\n0 0 0 0 0 0 0 0 3 0 3 0 0 0 0 0 0 0 3 0\n0 0 0 0 0 3 3 3 3 3 3 3 3 3 3 3 3 3 0 0\n0 0 0 0 3 3 3 0 0 3 0 3 0 3 0 0 0 0 3 0\n0 0 0 3 3 3 0 0 0 3 0 3 0 3 0 0 0 0 0 3\n0 0 3 3 3 0 0 0 0 3 0 3 0 3 0 0 0 0 0 0\n0 3 3 3 0 0 0 0 0 3 0 3 0 3 0 0 0 0 0 0\n0 3 3 0 0 0 0 0 0 3 0 3 0 3 3 3 3 3 3 0\n0 3 3 0 0 0 0 0 0 3 0 3 3 0 3 0 3 0 3 0\n0 3 3 0 0 0 0 0 0 3 0 3 0 3 0 3 0 3 0 3\n3 3 3 3 0 0 0 0 0 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 0 0 0 0 0 0 0 0 0 3 0 3 0 3 0 3\n\nTraining Example 4:\nInput:\n8 8 7 7 7 8 8 8 8 8 8 8\n8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 7 7 7 8 8 8 8 8 7\n8 7 7 8 8 7 8 8 8 8 7 7\n8 7 7 8 8 7 7 7 8 8 7 7\n8 7 7 8 8 7 8 7 8 8 7 8\n8 7 7 8 8 7 8 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 8 7 7\n8 7 7 8 8 7 8 7 7 7 7 8\n8 7 7 8 8 7 8 7 8 8 7 7\n8 7 7 8 8 7 7 7 8 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7\n8 7 7 7 7 7 8 8 8 8 7 8\n\nOutput:\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7\n8 8 8 7 7 8 8 8 8 8 8 8 8 8 7 7 7 7 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 8 7 7 7 7 7 7 7\n8 8 7 7 7 8 8 8 8 8 8 8 7 7 7 8 8 8 7 7\n8 7 7 7 7 7 8 8 8 8 8 7 7 7 8 8 8 8 8 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 8 8 8 8 8 8 8\n8 7 7 8 8 7 7 7 8 8 7 7 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 8 8 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 8 8\n8 7 7 8 8 7 8 7 7 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 8 7 7 7 7 8 8 8 8 8 8 8 7 8\n8 7 7 8 8 7 8 7 8 8 7 7 7 7 7 7 7 7 7 8\n8 7 7 8 8 7 7 7 8 8 7 8 8 8 8 8 7 8 7 8\n8 7 7 8 8 7 8 8 8 8 7 7 7 7 7 7 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 7 8 8 8 8 7 7 8 7 8\n8 8 7 7 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 8 8 8 7 8 8 8 7 8 8 8 8 7 7 8 7 8\n7 7 8 8 8 7 7 8 8 8 7 8 8 8 8 7 8 7 7 7\n8 7 7 7 8 7 8 8 8 7 8 7 8 8 8 7 7 8 7 8\n8 8 8 7 7 7 8 8 7 8 8 8 7 8 8 8 8 7 7 7\n\nTraining Example 5:\nInput:\n8 7 8 7 8 8 8 8 8 7\n8 7 8 7 8 8 8 8 8 8\n8 7 8 7 8 8 8 8 8 8\n8 7 8 7 7 7 7 7 7 8\n8 7 7 8 7 8 7 8 7 8\n8 7 8 7 8 7 8 7 8 7\n7 7 7 7 7 7 7 7 7 7\n8 8 8 7 8 7 8 7 8 
7\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 7 8 8\n8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 7 7 7 8\n8 8 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 8 7 8\n7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 7 8 8 7 7\n7 7 7 7 7 8 8 8 8 8 8 8 8 8 7 8 8 8 8 7\n8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 7 8 7 7 7\n8 8 8 8 8 8 7 8 8 8 8 8 7 8 8 7 7 7 8 8\n8 8 8 8 8 8 7 7 7 7 7 7 7 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 7 7 7 8 8 8 8 8 8 8 8 7\n8 8 8 8 8 8 8 8 7 8 7 8 8 8 8 8 8 8 7 8\n8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 7 7 7 8 8 7 8 7 8 7 8 8 8 8 7 8\n8 8 8 7 7 7 8 8 8 7 8 7 8 7 8 8 8 8 8 7\n8 8 7 7 7 8 8 8 8 7 8 7 8 7 8 8 8 8 8 8\n8 7 7 7 8 8 8 8 8 7 8 7 8 7 8 8 8 8 8 8\n8 7 7 8 8 8 8 8 8 7 8 7 8 7 7 7 7 7 7 8\n8 7 7 8 8 8 8 8 8 7 8 7 7 8 7 8 7 8 7 8\n8 7 7 8 8 8 8 8 8 7 8 7 8 7 8 7 8 7 8 7\n7 7 7 7 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 8 8 8 8 8 8 8 8 8 7 8 7 8 7 8 7\n\nTest Input 1:\n8 7 8 7 8 7 8 7 7 7\n8 8 8 8 8 8 8 8 8 8\n8 7 8 7 8 7 8 7 8 7\n7 8 7 8 7 8 7 8 8 7\n7 8 8 8 8 8 8 7 8 7\n7 7 7 7 7 7 8 7 8 7\n7 7 7 7 7 7 8 7 8 7\n8 7 7 7 7 7 8 7 8 7\n7 8 7 7 7 7 8 7 8 7\n7 7 8 8 8 8 8 8 8 8\n\nTest Input 2:\n6 6 6 6 6 5 5 5 5 5\n5 5 5 5 5 5 6 6 6 6\n6 6 6 5 6 6 6 6 6 6\n5 5 5 5 6 6 6 6 6 6\n5 5 6 6 6 6 6 6 6 6\n6 5 6 6 6 6 6 6 6 6\n5 5 5 5 5 6 6 6 6 6\n5 6 6 5 5 5 6 6 6 6\n5 6 6 6 5 5 5 6 6 6\n5 6 6 6 6 5 5 5 6 6\n5 6 6 6 6 6 5 5 5 6\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8 + ], + [ + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 7 + ], + [ + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 8, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 7 + ], + [ + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 
8, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7 + ], + [ + 7, + 8, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 8, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 8, + 8, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 8, + 7, + 7, + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 7, + 7, + 8, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 7, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7 + ], + [ + 7, + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 8, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7 + ] + ], + [ + [ + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 5, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6 + ], + [ + 5, + 5, + 6, + 6, + 5, + 5, + 
6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 6, + 6, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6 + ], + [ + 6, + 5, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6, + 6 + ], + [ + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 6 + ], + [ + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 6 + ], + [ + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 6 + ], + [ + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 6 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5 + ], + [ + 5, + 6, + 5, + 6, + 5, + 6, + 5, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 5, + 5, + 5, + 5 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_2b83f449.json b/problems/arc2_2b83f449.json new file mode 100644 index 0000000..b6279c8 --- 
/dev/null +++ b/problems/arc2_2b83f449.json @@ -0,0 +1,371 @@ +{ + "problem_id": "arc2_2b83f449", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n3 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 7 7 7 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 7 7 7 0 0 0 0 7 7 7 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 7 7 7 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 7 7 7 0 0 0 7 7 7 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 0 8 8 3\n0 0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 7 7 7 0 0 0 0 0 7 7 7 0 0 0 0\n8 8 0 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 6 8 8 0 8 8 6 8 8 8 8 8 8 8 8\n0 0 0 8 6 8 0 0 0 8 6 8 0 0 0 0 0 0 0\n3 3 8 8 6 8 6 8 8 8 6 8 8 6 8 8 8 8 8\n0 0 0 0 0 8 6 8 0 0 0 0 8 6 8 0 0 0 0\n8 8 8 6 8 8 6 8 6 8 8 8 8 6 8 6 8 8 8\n0 0 8 6 8 0 0 8 6 8 0 0 0 0 8 6 8 0 0\n3 3 8 6 8 6 8 8 6 8 8 6 8 8 8 6 8 3 3\n0 0 0 0 8 6 8 0 0 0 8 6 8 0 0 0 0 0 0\n3 8 8 8 8 6 8 8 6 8 8 6 8 8 3 0 8 8 3\n0 0 0 0 0 0 0 8 6 8 0 0 0 0 0 0 0 0 0\n8 8 8 8 8 6 8 8 6 8 8 8 8 6 8 8 8 8 8\n0 0 0 0 8 6 8 0 0 0 0 0 8 6 8 0 0 0 0\n8 8 0 3 8 6 8 8 0 3 8 8 8 6 8 8 8 8 3\n\nTraining Example 2:\nInput:\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 0 0 0 7 7 7 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 6 8 8 8 8 8 8 8 8 8 8 8\n0 0 0 8 6 8 0 0 0 0 0 0 0 0 0 0\n3 3 8 8 6 8 8 8 8 8 8 8 6 8 8 8\n0 0 0 0 0 0 0 0 0 0 0 8 6 8 0 0\n8 8 8 8 8 8 6 8 8 8 8 8 6 8 3 3\n0 0 0 0 0 8 6 8 0 0 0 0 0 0 0 0\n8 8 8 6 8 8 6 8 8 8 8 6 8 8 8 8\n0 0 8 6 8 0 0 0 0 0 8 6 8 0 0 0\n3 3 8 6 8 8 8 6 8 8 8 6 8 8 3 3\n0 0 0 0 0 0 8 6 8 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 6 8 8 8 8 8 8 8 3\n\nTest 
Input:\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 7 7 7 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 7 7 7 0 0\n3 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 7 7 7 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 0 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 0 0 0 7 7 7 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0 0\n3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 7 7 7 0 0 0 0 0 0 7 7 7 0 0 0\n8 8 8 8 8 8 8 0 8 8 8 8 8 8 8 8 8\n\nGive your answer in ... tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0 + ], + [ + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 3, + 8, + 8, + 8, + 8, + 6, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 3, + 3, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 3, + 0, + 8, + 8, + 8, + 8, + 8, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 
0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8 + ], + [ + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 6, + 8, + 0, + 0, + 0 + ], + [ + 3, + 8, + 8, + 6, + 8, + 8, + 3, + 0, + 3, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 3 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_446ef5d2.json b/problems/arc2_446ef5d2.json new file mode 100644 index 0000000..a130756 --- /dev/null +++ b/problems/arc2_446ef5d2.json @@ -0,0 +1,1180 @@ +{ + "problem_id": "arc2_446ef5d2", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 7 7 7\n8 8 8 8 8 8 8 8 8 7 7 7 7 7 7 8 8 2 2 2\n8 8 8 8 8 8 8 8 8 0 0 0 7 0 7 8 8 7 7 7\n8 8 8 8 8 8 8 8 8 0 7 0 0 0 7 8 8 7 7 7\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 7 0 0 0 0 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 7 0 7 0 0 8 8 8 8 8 8 8 8 8 7 7 7 8 8\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 2 2 7 8 8\n8 7 2 7 2 2 8 8 8 8 8 8 8 8 8 7 2 7 8 8\n8 7 2 2 2 7 8 8 8 8 8 8 8 8 8 7 7 7 4 8\n8 7 7 7 7 7 8 8 8 8 8 8 8 8 8 8 8 4 4 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 7 0 0 0 0 0 0 0 7 0 7 8 8\n8 8 8 8 8 8 8 7 0 7 0 0 0 7 0 0 0 7 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 7 2 7 2 2 2 2 2 2 2 7 8 8\n8 8 8 8 8 8 8 7 2 2 2 7 7 7 7 7 2 7 8 8\n8 8 8 8 8 8 8 7 7 7 7 7 7 7 7 7 7 7 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 
8 8 8\n8 4 4 8 8 8 9 9 3 8\n8 4 3 3 3 8 3 3 3 8\n8 8 3 9 9 8 3 3 3 8\n8 8 3 9 9 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n8 3 3 3 8 8 3 9 9 8\n8 9 9 3 8 8 3 9 3 8\n8 9 9 3 8 8 3 3 3 8\n8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n8 8 3 3 3 3 3 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 9 9 9 3 8 8\n8 8 3 9 3 3 3 3 8 8\n8 8 3 3 3 3 3 3 8 8\n8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8\n\nTest Input 1:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 1 1 1\n4 1 3 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 3 3 4 6 6 1\n4 1 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 1 1 4 1 6 1\n4 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 1 3 1 1 4 1 6 1\n4 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 6 6 1\n4 1 1 6 6 4 1 1 1 1 3 1 4 4 4 4 1 1 7 1 1 1 4 1 1 1\n4 1 1 6 1 4 3 3 3 3 3 1 4 4 4 4 1 1 7 1 1 1 4 4 4 4\n4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4 7 7 7 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 4 4 4 4\n1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n1 1 1 4 4 4 4 1 1 1 1 1 1 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 1 1 4 4 4 4 3 3 3 3 3 1 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 6 6 4 4 4 4 1 1 1 1 3 1 4 4 4 4 4 4 4 1 1 1 1 1 1\n4 1 1 4 4 4 4 1 1 1 1 3 1 4 1 1 6 1 1 4 7 7 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 6 6 6 4 1 1 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 4 1 1 7 1 1 1\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4 4 4 4 4 4\n4 4 1 7 1 1 4 4 4 4 4 4 4 4 1 7 7 7 4 4 4 4 4 4 4 4\n4 4 1 7 7 7 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 4 1 1 1 1 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 2 1 1 1 1 4 4 4 4 4 4 4 4 1 7 1 1 4 4 4 4 4 4 4 4\n4 2 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 9 9 9 8 8 8 8 8 8 8 4 4 8\n8 8 8 8 8 8 3 3 9 9 8 8 8 8 8 9 9 9 4 8\n9 9 9 8 8 8 9 3 9 9 8 8 8 8 8 9 3 9 8 8\n9 3 3 
8 8 8 3 3 3 3 8 8 8 8 8 3 3 9 8 8\n9 3 9 8 8 8 9 3 3 3 8 8 8 8 8 3 3 9 8 8\n9 3 3 8 8 8 3 3 9 9 8 8 8 8 8 8 8 8 8 8\n9 3 9 8 8 8 9 9 9 9 8 8 8 8 8 8 8 8 8 8\n9 3 3 8 8 8 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n9 9 9 8 8 8 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 3 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 9 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 9 8 8 8 8\n8 8 8 9 9 9 8 8 8 8 8 8 8 9 3 3 8 8 8 8\n8 8 8 9 3 9 8 8 8 8 8 8 8 9 9 9 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 9 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 9 3 3 8 8 8 8 8 3 3 9 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 3 3 9 8 8 8 8 8 8\n8 8 8 9 9 9 8 8 8 8 8 9 9 9 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, 
+ 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 1, + 1, + 1, + 1, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 9, + 9, + 3, + 9, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 3, + 9, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 8, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, 
+ 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_4e34c42c.json b/problems/arc2_4e34c42c.json new file mode 100644 index 0000000..21c235a --- /dev/null +++ b/problems/arc2_4e34c42c.json @@ -0,0 +1,495 @@ +{ + "problem_id": "arc2_4e34c42c", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 1 8 8 2 8 2 3 3 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 4 1 1 1 2 2 2 3 2 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 1 8 8 2 8 2 3 3 3 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 8 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 4 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 1 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 8 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n6 8 9 8 8 8 8 8 8 8 8 8\n6 1 1 1 8 8 2 8 2 3 3 3\n6 1 4 1 1 1 2 2 2 3 2 3\n6 1 1 1 8 8 2 8 2 3 3 3\n6 8 9 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 8 1 1 1 3 3 1 4 4 4\n4 1 1 1 4 4 4 4 4 4 8 4 4 1 4 4 1 4 4 4\n4 1 2 1 4 4 4 4 4 4 8 1 1 1 3 3 1 4 4 4\n4 1 1 1 4 4 4 4 4 4 4 4 4 1 1 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 1 1 1 4 4 4 4 4 4 4 5 3 5 4 4\n4 4 4 4 4 1 2 1 3 3 3 3 3 3 3 3 5 3 4 4\n4 4 4 4 4 1 1 1 4 4 4 4 4 4 4 5 3 5 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 5 3 5 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 3 5 3 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 5 3 5 6 6 8 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nOutput:\n4 4 4 4 4 4 4 4 4 4 4 6 6 6 4 4 4 4 1 1 1 1\n1 1 1 4 4 4 4 4 4 4 5 3 5 6 6 8 1 1 1 3 3 1\n1 2 1 3 3 3 3 3 3 3 3 5 3 6 6 8 4 4 1 4 4 1\n1 1 1 4 4 4 4 4 4 4 5 3 5 6 6 8 1 1 1 3 3 1\n4 4 4 4 4 4 4 4 4 4 4 6 6 6 4 4 4 4 1 1 1 1\n\nTest Input 1:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 6 6 1 1 1 1 3 3 3 3 3 3 3 3 6 6 3 3\n3 3 8 6 1 3 3 8 8 8 3 3 3 9 9 9 6 8 3 3\n3 3 6 6 1 1 1 1 7 8 3 3 3 9 3 3 6 6 3 3\n3 3 3 3 3 3 3 8 8 8 3 3 3 9 
3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 1 7 1 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 4 4 4 3 3 3 3 3 1 7 8 3 3 3 3 3 3 3 3\n3 3 4 3 3 3 3 3 3 8 8 8 3 3 3 3 3 3 3 3\n3 3 4 3 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 1 1 1 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 1 6 1 3 3 3 3 3 3 7 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 2 2 2 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 1 1 1 3 3 3 1 1 1 3 3\n3 3 3 3 2 3 2 3 3 1 6 1 3 3 3 1 7 1 3 3\n3 3 3 3 4 4 4 3 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 4 4 1 4 4 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 3 4 4 4 3 3 3 8 3 3 3 3 3 8 3 3 3\n3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 2 3 2 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTest Input 2:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 2 4 2 1 1 1 1 3 2 2 1 1 1\n1 1 1 1 1 1 1 2 2 2 1 1 1 1 1 2 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 2 2 1 1 1\n1 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 2 4 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 2 2 2 1 1 1 1 1 4 4 4 1 6 1 6 1 8 8 8\n1 1 3 1 1 1 1 1 1 4 7 4 8 8 8 8 8 8 7 8\n9 9 3 9 9 1 1 1 1 4 4 4 8 1 1 1 8 8 8 8\n1 9 9 9 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 6 1 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 8 8 8 3 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 8 7 8 3 3 1 1 1 1 1 1\n1 1 1 6 4 4 4 1 1 8 8 8 3 3 3 1 1 1 1 1\n1 6 6 6 4 7 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 6 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 3, + 3 + ], + [ + 4, + 4, + 4, + 3, 
+ 3, + 3, + 3, + 9, + 9, + 9, + 6, + 8, + 6, + 1, + 3, + 3, + 8, + 8, + 8 + ], + [ + 3, + 4, + 3, + 3, + 3, + 3, + 3, + 9, + 3, + 3, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 7, + 8 + ], + [ + 3, + 4, + 3, + 3, + 3, + 3, + 3, + 9, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 1, + 6, + 1, + 3, + 3, + 3, + 1, + 7, + 1, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 7, + 3 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 2, + 2, + 2 + ], + [ + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 2, + 3, + 2, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 4, + 4, + 1, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 4, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 3, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 6, + 4, + 4, + 4, + 1, + 6, + 1, + 6, + 1, 
+ 8, + 8, + 8, + 3, + 3, + 3, + 2, + 2 + ], + [ + 6, + 6, + 6, + 4, + 7, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 3, + 1, + 2, + 1 + ], + [ + 1, + 1, + 6, + 4, + 4, + 4, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 2, + 2 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_5dbc8537.json b/problems/arc2_5dbc8537.json new file mode 100644 index 0000000..33672c1 --- /dev/null +++ b/problems/arc2_5dbc8537.json @@ -0,0 +1,482 @@ +{ + "problem_id": "arc2_5dbc8537", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n9 4 4 4 4 4 9 4 4 4 4 4 4 4 4\n9 4 4 4 4 4 9 4 4 4 8 8 8 8 8\n9 9 4 4 9 9 9 4 4 4 8 8 8 8 8\n9 9 4 4 9 9 9 4 4 4 4 4 4 4 4\n9 9 4 4 9 9 9 4 3 3 4 1 1 4 4\n9 9 4 4 9 9 9 4 3 3 4 1 1 4 4\n9 9 4 4 4 9 9 4 3 3 4 4 4 4 4\n9 9 4 4 9 9 9 4 3 3 4 5 5 5 5\n9 4 4 9 9 9 9 4 3 3 4 4 4 4 4\n9 4 4 9 9 9 9 4 3 3 4 4 4 4 4\n9 9 4 4 4 4 9 4 4 4 4 4 4 7 7\n9 9 9 4 4 9 9 4 5 5 5 5 4 7 7\n9 9 9 4 4 9 9 4 4 4 4 4 4 7 7\n9 9 9 4 4 9 9 4 4 0 4 4 4 4 4\n9 9 4 4 4 4 9 4 4 4 4 4 4 4 4\n\nOutput:\n9 8 8 8 8 8 9\n9 8 8 8 8 8 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 9 9 9\n9 9 3 3 0 9 9\n9 9 3 3 9 9 9\n9 1 1 9 9 9 9\n9 1 1 9 9 9 9\n9 9 5 5 5 5 9\n9 9 9 7 7 9 9\n9 9 9 7 7 9 9\n9 9 9 7 7 9 9\n9 9 5 5 5 5 9\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 4 7 4 7 4 7 8 8 8 6 6 8 8 8 8 8 8 8 8\n8 7 4 7 4 7 4 8 9 8 6 6 8 8 1 1 1 8 8 8\n8 4 7 4 7 4 7 8 9 8 6 6 8 8 1 9 1 8 8 8\n8 7 4 7 4 7 4 8 9 8 6 6 8 8 1 1 1 8 0 8\n8 8 8 8 8 8 8 8 9 8 6 6 8 8 1 9 1 8 8 8\n8 8 5 5 8 8 8 8 9 8 8 8 8 8 1 1 1 8 8 8\n8 8 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 0 8\n8 8 5 5 8 8 3 3 3 8 8 8 8 8 8 4 4 8 8 8\n8 8 5 5 8 8 3 3 3 8 8 8 8 8 8 4 4 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 8 2 2 2 2 2 8 8 2 2 2 2 2 2 2\n2 2 2 2 8 8 8 2 2 2 8 8 8 2 2 2 2 2 2 2\n8 8 8 8 8 8 8 2 2 2 8 8 8 8 
8 8 8 8 8 2\n8 8 8 8 8 8 8 2 2 2 8 8 8 8 8 8 8 8 8 8\n2 2 8 8 8 8 8 2 2 2 8 2 2 8 8 8 8 8 8 2\n2 2 8 8 8 8 8 8 8 8 8 2 2 8 8 8 8 8 8 2\n2 2 8 8 2 2 2 8 8 8 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nOutput:\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 0 2 2 2 2 2 5 5 2 2 2 2 2 2 2\n2 2 2 2 1 1 1 2 2 2 9 5 5 2 2 2 2 2 2 2\n4 4 6 6 1 9 1 2 2 2 9 5 5 4 7 4 7 4 7 2\n4 4 6 6 1 1 1 2 2 2 9 5 5 7 4 7 4 7 4 0\n2 2 6 6 1 9 1 2 2 2 9 2 2 4 7 4 7 4 7 2\n2 2 6 6 1 1 1 3 3 3 9 2 2 7 4 7 4 7 4 2\n2 2 6 6 2 2 2 3 3 3 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTest Input 1:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 1 1 3 3 1 1 3 3 3 3 1 3 3 3 3 3 3 3 3 1 1 3\n1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1 3 3 1 3 1 1 1 1 3\n1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 3\n1 1 1 1 1 3 3 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 3\n1 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 3 3 1 3 3 3 1 1 1\n1 1 1 1 1 3 1 1 1 1 1 1 1 1 1 1 3 3 3 3 3 3 1 1 1\n1 1 1 1 1 3 3 1 1 3 3 1 1 1 1 1 3 3 3 3 3 3 1 1 1\n1 1 1 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 1 1 1\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 9 9 1 1 1 1 6 6 6 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 8 6 8 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 1 1 1 6 6 8 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 8 6 8 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 1 1 1 6 6 8 6 6 1 1 1 4 4 1 1 2 2 2 1 1 1\n1 9 9 1 1 1 1 6 6 6 6 6 1 1 1 4 4 1 1 2 5 2 1 1 1\n1 9 9 1 4 4 1 1 1 1 1 1 1 1 1 9 9 1 1 2 2 2 1 1 1\n1 9 9 1 4 4 1 7 7 7 7 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 4 4 1 7 7 7 7 1 1 1 1 1 1 1 1 1 1 1 8 8 1\n1 1 1 1 4 4 1 1 1 1 1 1 1 1 5 5 1 1 1 6 1 1 8 8 1\n1 8 8 1 4 4 1 0 1 0 1 1 1 1 5 5 1 1 1 6 1 1 1 1 1\n1 8 8 1 4 4 1 1 1 1 1 1 1 1 5 5 1 1 1 6 1 1 1 1 1\n1 1 1 1 9 9 1 0 1 0 1 1 1 1 1 1 1 1 1 6 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n1 3 3 1 1 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 3 3 1 1 1 1 3 4 7 4 7 3 9 9 9 8 3 3\n1 1 1 3 3 
1 1 1 3 7 4 7 4 3 8 9 9 9 3 3\n1 1 1 1 3 3 1 1 3 4 7 4 7 3 3 3 3 3 3 3\n1 3 3 3 3 3 3 1 3 3 3 3 3 3 3 3 6 6 3 3\n1 3 3 3 3 3 3 1 3 6 6 3 3 3 3 3 6 6 3 3\n1 1 3 3 1 3 1 1 3 6 6 3 3 3 3 3 3 3 3 3\n1 1 3 3 1 1 1 1 3 3 3 3 3 5 5 3 3 3 3 3\n1 3 3 3 1 1 1 1 3 4 4 9 3 3 3 3 3 3 3 3\n1 3 3 3 1 1 1 1 3 9 4 4 3 3 3 5 5 3 3 3\n1 1 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 3 3 3 3 1 3 3 8 8 8 3 3 3 3 3 3 3\n1 1 1 3 3 3 3 1 3 3 3 3 3 3 3 3 3 3 0 3\n1 3 3 3 3 1 1 1 3 3 2 2 2 2 2 2 3 3 3 3\n1 3 3 3 3 1 1 1 3 3 2 2 2 2 2 2 3 3 0 3\n1 3 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n1 1 1 3 3 3 1 1 3 3 3 3 3 5 5 3 3 3 0 3\n1 1 1 3 3 1 1 1 3 4 4 9 3 3 3 3 3 3 3 3\n1 1 3 3 3 3 1 1 3 9 4 4 3 3 5 5 3 3 3 3\n1 1 3 3 3 1 1 1 3 3 3 3 3 3 3 3 3 3 3 3\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 4, + 4, + 3, + 3, + 4, + 4, + 3, + 3, + 3, + 3, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 3 + ], + [ + 2, + 2, + 2, + 4, + 4, + 8, + 8, + 4, + 4, + 3, + 3, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 0, + 3, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 5, + 2, + 4, + 4, + 8, + 8, + 4, + 4, + 3, + 3, + 6, + 8, + 6, + 8, + 6, + 7, + 7, + 7, + 7, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 2, + 2, + 4, + 4, + 3, + 3, + 4, + 4, + 3, + 3, + 6, + 6, + 8, + 6, + 6, + 7, + 7, + 7, + 7, + 5, + 5, + 9, + 9, + 3 + ], + [ + 2, + 5, + 2, + 4, + 4, + 3, + 3, + 4, + 4, + 8, + 8, + 6, + 8, + 6, + 8, + 6, + 3, + 3, + 0, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 2, + 2, + 4, + 4, + 3, + 0, + 4, + 4, + 8, + 8, + 6, + 6, + 8, + 6, + 6, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 5, + 2, + 9, + 9, + 3, + 3, + 9, + 9, + 3, + 3, + 6, + 6, + 6, + 6, + 6, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 2, + 2, + 2, + 3, + 3, + 3, + 3, + 3, + 
3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 9, + 9, + 6 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 1, + 5, + 5, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 5, + 5, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 5, + 5, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 5, + 5, + 1, + 1 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1 + ], + [ + 1, + 2, + 2, + 2, + 2, + 2, + 2, + 1 + ], + [ + 1, + 1, + 6, + 6, + 1, + 0, + 1, + 1 + ], + [ + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1 + ], + [ + 1, + 4, + 4, + 9, + 1, + 1, + 1, + 1 + ], + [ + 1, + 9, + 4, + 4, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 8, + 8, + 8, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 9, + 9, + 9, + 8, + 1 + ], + [ + 1, + 1, + 1, + 8, + 9, + 9, + 9, + 1 + ], + [ + 1, + 4, + 7, + 4, + 7, + 1, + 1, + 1 + ], + [ + 1, + 7, + 4, + 7, + 4, + 1, + 1, + 1 + ], + [ + 1, + 4, + 7, + 4, + 7, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 6, + 6, + 0, + 1, + 1 + ], + [ + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1 + ], + [ + 1, + 1, + 4, + 4, + 9, + 0, + 1, + 1 + ], + [ + 1, + 1, + 9, + 4, + 4, + 1, + 1, + 1 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_62593bfd.json b/problems/arc2_62593bfd.json new file mode 100644 index 0000000..c56b8d2 --- /dev/null +++ b/problems/arc2_62593bfd.json @@ -0,0 +1,1257 @@ +{ + "problem_id": "arc2_62593bfd", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 3 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 3 3 3 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n4 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 2 2 2 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 
5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 3 5 5 5 5 5\n5 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 7 5 5 9 9 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 7 7 5 5 9 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 2 5 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 4 4 4 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n\nOutput:\n5 5 5 5 2 2 2 5 5 5 5 5 5 7 5 5 9 9 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 2 5 2 2 5 5 5 5 7 7 5 5 9 5 5 5 5 5 3 5 3 5 5 5 5 5\n5 5 5 5 2 2 2 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3 3 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 
5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 4 5 5 5 5 5 5 5 5\n5 5 5 5 1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 4 4 4 5 5 5 5 5 5 5\n\nTest Input 1:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 1 1 1 1\n1 1 1 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 5 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 5 5 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 5 1 1 1 5 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 
1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 3 1 1 1 3 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1 1\n1 1 1 1 1 3 3 3 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1 1\n1 1 1 1 1 3 1 3 1 1 1 1 1 1 1 1 1 1 3 3 3 1 1 1 1\n1 1 1 1 1 3 3 3 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1\n1 1 1 1 3 1 1 1 3 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 3 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 3 9 3 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 4 4 4 9 9 9 9 9 3 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 9 9 9 9 9 4 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 1 1 1 1 9 9 9 9 9 9 9 9 4 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 1 9 9 9 9 7 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 6 6 6 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 6 9 9 9 9 9\n9 9 8 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 8 8 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9 9\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse 
space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 5, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 3, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 5, + 5, + 5, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 3, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 5, + 1, + 1, + 1, + 5, + 1 + ] + ], + [ + [ + 9, + 9, + 8, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 7, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 8, + 8, + 9, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 6, + 6, + 6, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 9, + 9, + 9, + 9, + 9 + ], + [ + 
9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 4, + 4, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 
9, + 4, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 3, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 9, + 9, + 9, + 9 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_71e489b6.json b/problems/arc2_71e489b6.json new file mode 100644 index 0000000..8329bd0 --- /dev/null +++ b/problems/arc2_71e489b6.json @@ -0,0 +1,678 @@ +{ + "problem_id": "arc2_71e489b6", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n1 1 1 0 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 0 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 0 0 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0\n0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 7 0 7 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 7 7 7 1 1 1 1 1 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 0\n1 1 1 1 1 1 1 7 7 7 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 7 0 7 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 7 7 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 7 0 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 0 0 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 7 7 7 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 7 7 7 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 7 0 7 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 7 7 7 1\n\nTraining Example 
2:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 1 0 0 0 1 1 1 1 1 1 0 1 1 1\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 0 1\n1 1 0 0 0 0 1 1 0 1 1 1 0 1 1 1\n1 1 0 0 1 0 1 1 1 1 1 1 0 1 1 0\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 7 7\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 0 0 0 0 1 1 1 1 1 1 0 7 7 7\n1 1 0 0 0 0 1 7 7 7 1 1 0 7 0 7\n1 1 0 0 0 0 1 7 0 7 1 1 0 7 7 7\n1 1 0 0 0 0 1 7 7 7 1 1 0 1 7 0\n1 1 0 0 0 0 1 1 1 1 1 1 0 1 7 7\n1 1 0 0 0 0 0 0 0 0 0 0 0 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 7 7 7 7 1 1 1 1 1 1 1\n1 1 1 1 1 7 0 0 7 1 1 1 1 1 1 1\n1 1 1 1 1 7 7 7 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 1\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 0 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 0 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 0 1 1 1 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 7 7 7 1 1 0 0\n0 0 0 0 1 1 1 1 1 7 0 7 7 1 0 0\n0 0 0 0 1 1 1 1 1 7 7 0 7 1 0 0\n0 0 0 0 1 1 1 1 1 1 7 7 7 1 0 0\n0 0 0 0 1 1 1 1 1 1 1 1 1 1 0 0\n0 0 0 0 1 1 1 1 1 1 
1 1 1 1 0 0\n0 0 0 0 1 1 7 7 7 1 1 1 1 1 0 0\n0 0 0 0 1 1 7 0 7 1 1 1 1 1 0 0\n0 0 0 0 0 0 7 7 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 1\n1 1 1 1 1 0 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 0 1 1 1 1 1 1 1 1 1 0 1\n1 1 1 0 1 1 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 0 0\n1 1 1 1 1 1 1 1 1 1 1 0 1 1 1 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 1 0 1 1 1 1 1 1 1 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 1 0 0 0\n1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 1\n\nTest Input 2:\n0 0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 1 1 0 1 1 1 1 1 1 1 1 1 1 1 0 1 1\n0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0\n0 0 1 1 1 1 0 1 1 0 0 0 0 1 0 0 0 0 0\n0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0\n1 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 0 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 0 1 0 1 1 0 0 1 1 1 0 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 0 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 1 1 1 1 1 1 1 0 0 1 1 1 1 1 1 1 1\n0 0 0 1 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 1 0 0 1 1 1 1 1 1 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 1 1 0 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, 
+ 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 7, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 7, + 0, + 7, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 0, + 7, + 7, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 7, + 7, + 1 + ], + [ + 0, + 0, + 1, + 7, + 0, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 7, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 7, + 0, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 7, + 7, + 7, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 0, + 7, + 7, + 1, + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 0, + 7, + 0, + 7, + 1, + 
0, + 0, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 7, + 7, + 7, + 7, + 7, + 1, + 0, + 0, + 1, + 1, + 7, + 0, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 7, + 7, + 7, + 1, + 1, + 1 + ], + [ + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 1, + 1, + 1, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 7, + 7, + 1, + 1, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 7, + 1, + 1, + 1, + 1 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_88bcf3b4.json b/problems/arc2_88bcf3b4.json new file mode 100644 index 0000000..a0a7aa7 --- /dev/null +++ b/problems/arc2_88bcf3b4.json @@ -0,0 +1,1323 @@ +{ + "problem_id": "arc2_88bcf3b4", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0\n0 0 0 0 0 2 0\n0 0 0 0 0 0 0\n0 0 0 4 4 8 0\n0 0 0 4 0 8 0\n0 0 4 4 0 8 0\n0 4 0 0 0 8 0\n\nOutput:\n0 0 0 0 0 4 0\n0 0 0 0 4 2 0\n0 0 0 0 4 0 0\n0 0 0 0 4 8 0\n0 0 0 0 0 8 0\n0 0 0 0 0 8 0\n0 0 0 0 0 8 0\n\nTraining Example 2:\nInput:\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 7 7 7 7 7 7 7 7\n7 7 7 7 7 7 3 2 7 7 7 7\n7 7 7 7 7 3 7 2 7 7 7 7\n7 7 7 7 7 3 7 2 7 7 7 7\n7 7 7 3 3 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n\nOutput:\n7 7 7 7 4 7 7 7 7 7 7 7\n7 7 7 3 4 7 7 7 7 7 7 7\n7 7 7 3 4 7 7 7 7 7 7 7\n7 7 7 7 3 7 7 7 7 7 7 7\n7 7 7 7 7 3 7 7 7 7 7 7\n7 7 7 7 7 7 3 2 7 
7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n7 7 7 7 7 7 7 2 7 7 7 7\n\nTraining Example 3:\nInput:\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 7 7 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 7 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 7 7 1 1 1 1\n1 1 1 1 1 1 2 1 7 7 7 1 1 1 1 1 1\n1 1 1 1 1 1 2 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 2 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 9 7 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 7 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 4:\nInput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0 0\n0 0 3 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 8 0 5 0 0 0 0 0\n0 0 8 0 5 0 0 0 0 0\n0 8 8 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n\nOutput:\n0 0 0 8 0 0 0 0 0 0\n0 0 8 3 0 0 0 0 0 0\n0 8 3 0 0 0 0 0 0 0\n0 0 8 3 0 0 0 0 0 0\n0 0 0 8 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n\nTraining Example 5:\nInput:\n0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 0 0 0\n0 0 0 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0\n0 0 0 0 9 6 0 0 0\n0 0 
0 9 0 6 0 0 0\n9 9 9 0 0 6 0 0 0\n9 0 0 0 0 6 0 0 0\n\nOutput:\n0 0 0 0 9 0 0 0 0\n0 0 0 9 0 0 0 0 0\n0 0 9 3 0 0 0 0 0\n0 0 9 3 0 0 0 0 0\n0 0 0 9 0 0 0 0 0\n0 0 0 0 9 6 0 0 0\n0 0 0 0 0 6 0 0 0\n0 0 0 0 0 6 0 0 0\n0 0 0 0 0 6 0 0 0\n\nTest Input 1:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 8 5 5 5 5 5 5 5 9 9 5 5 5 5 5 5 5 5 5 5\n5 5 5 8 5 5 5 5 5 5 9 9 9 5 5 5 5 5 5 5 5 5\n5 5 5 5 8 5 5 5 5 5 9 9 9 9 5 5 5 5 5 5 5 5\n5 5 5 5 5 8 8 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n3 3 3 3 3 3 3 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 4 4 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 4 4 4 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 4 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 1 5 5 5 5 5 5 5 5 5 5 5 5 5\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 1 1 1 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 8 8 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 1 1 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 1 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 9 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 2 2 2 2\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 8 5 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 5 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 5 8 8 8\n8 8 8 8 5 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 5 5 8 8\n8 8 8 8 5 5 5 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 4 4 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 4 4 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 9, + 9, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 9, + 9, + 9, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 5, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 8, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 
5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 6, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 4, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, 
+ 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 6, + 6, + 8, + 8, + 5, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 5, + 6, + 6, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 4, + 5, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 4, + 5, + 5, + 5, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 4, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_88e364bc.json b/problems/arc2_88e364bc.json new file mode 100644 index 0000000..a242321 --- /dev/null +++ b/problems/arc2_88e364bc.json @@ -0,0 +1,892 @@ +{ + "problem_id": "arc2_88e364bc", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 7 7 7 7 7 0 0 5 5 5 5 5\n0 0 
0 0 0 0 0 7 7 0 0 0 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 7 7 0 4 0 0 7 0 0 0 0 0 0 0\n0 7 7 7 7 7 7 0 0 0 7 7 7 0 0 5 5 5 5 0\n0 7 0 0 0 0 0 0 0 7 7 0 0 5 5 5 0 0 5 0\n0 7 0 0 0 0 0 0 0 7 5 5 5 5 0 0 0 0 5 0\n0 7 7 0 4 0 0 0 0 7 5 0 0 0 0 0 0 5 5 0\n0 0 7 7 7 7 0 0 0 7 5 0 0 0 0 0 0 5 0 0\n0 0 0 0 0 7 7 7 7 7 5 0 0 0 0 4 0 5 0 0\n0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 5 0 0\n0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 5 0 0 4 0 5 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 0 0 0 0 5 0 0 0 0 0 0 4 0 0 0 0 5 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 0 5 0 5 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n\nOutput:\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n7 1 1 2 7 0 0 0 0 0 0 0 0 0 0 5 2 1 1 5\n7 7 7 7 7 0 0 0 7 7 7 7 7 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 7 7 0 0 0 7 0 0 0 0 0 0 0\n0 0 0 0 0 0 7 7 0 0 0 4 7 0 0 0 0 0 0 0\n0 7 7 7 7 7 7 0 0 0 7 7 7 0 0 5 5 5 5 0\n0 7 0 0 0 0 0 0 0 7 7 0 0 5 5 5 0 0 5 0\n0 7 0 0 0 0 0 0 0 7 5 5 5 5 0 0 0 0 5 0\n0 7 7 0 0 0 0 0 4 7 5 0 0 0 0 0 0 5 5 0\n0 0 7 7 7 7 0 0 0 7 5 0 0 0 0 0 0 5 0 0\n0 0 0 0 0 7 7 7 7 7 5 4 0 0 0 0 0 5 0 0\n0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 5 0 0\n0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 5 4 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 0 0 0 0 5 4 0 0 0 0 0 0 0 0 0 0 5 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 0 0 5 5 0\n0 0 5 0 5 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 1 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 5 1 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 1 5 5 2 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 2 5 5 5\n0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0\n0 0 5 4 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 
0 0 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 5 0 0 4 0 0 5 5 0 0 0 0\n0 5 5 0 5 5 5 0 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 0 0 0 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 1 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 5 1 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 1 5 5 2 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 2 5 5 5\n0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 5\n0 0 0 0 0 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 4 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 0 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 5 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0 0 0 0\n0 5 0 0 0 0 5 5 5 0 0 0 0 0 5 5 0 0 0 0\n0 5 5 0 5 5 5 0 5 0 0 0 4 5 5 0 0 0 0 0\n0 0 5 5 5 0 0 0 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 2 5 2 5\n0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 4 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 0 0 5 0 0 0 0 0 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 0 0 5 5 5 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 5 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 5 5 0 0 4 0 0 0 4 0 0 0 0 0 5 0 0 0\n0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 0 5 0 0 0\n0 0 0 0 5 0 0 5 5 0 0 0 5 5 5 5 5 0 0 0\n0 0 0 0 5 0 0 5 5 5 0 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 5 5 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 1 5 1 5\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 2 5 2 5\n0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5\n0 0 0 0 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0 0 0 5 0 0 0 0 0 0 0\n0 0 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0\n0 0 5 0 0 4 0 0 0 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 0 0 5 5 5 5 0 0 0 0 5 5 0 0 0 0 0\n0 0 5 5 5 5 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0\n0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 0 5 0 0 0\n0 0 0 0 5 0 0 5 5 0 0 0 5 5 5 5 5 0 0 0\n0 0 0 0 5 0 0 5 5 5 4 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 0 5 5 0 5 0 0 0 0 0 0 0\n0 0 0 0 5 0 4 5 0 0 5 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n5 5 5 1 5 5 5 0 0 5 5 5 0 0 0 0 0 0 0 0\n5 1 5 5 1 5 5 0 0 5 0 5 5 5 0 0 0 0 0 0\n5 5 1 5 5 2 5 0 0 5 0 4 0 5 0 0 5 5 0 0\n5 5 5 2 5 5 5 0 0 5 0 0 0 5 5 5 5 5 5 0\n5 5 5 5 5 5 5 0 0 5 0 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 0 5 0 4 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 1 1 1 1 1 5 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 1 0 0 0 1 5 5 5 0 0 5 5 5 5 0\n0 0 0 0 0 1 0 0 0 1 1 1 5 5 5 5 0 0 0 0\n0 0 0 0 0 1 1 0 0 0 0 1 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 1 1 0 4 0 1 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 1 0 0 0 0 1 0 0 1 1 0 0\n0 0 0 0 0 0 0 0 1 1 0 0 0 1 0 0 0 1 1 0\n1 1 1 1 1 0 0 0 0 1 1 1 1 1 0 0 0 0 1 0\n1 2 1 2 1 0 0 0 0 1 0 0 0 0 0 0 0 0 1 0\n1 5 1 5 1 0 0 0 0 1 0 0 0 0 0 0 4 0 1 0\n1 5 1 5 1 0 0 0 0 1 1 4 1 1 1 1 1 1 1 0\n1 1 1 1 1 0 0 0 0 0 1 1 1 0 0 0 0 0 0 0\n\nTest Input 2:\n6 6 6 6 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n6 2 6 2 6 0 0 3 3 3 3 3 3 3 0 0 6 6 6 6\n6 1 6 1 6 0 0 3 0 0 0 0 0 3 0 0 6 0 0 6\n6 1 6 1 6 0 3 3 0 0 0 0 0 3 6 6 6 6 0 6\n6 6 6 6 6 0 3 0 0 0 0 0 3 3 6 0 0 0 0 6\n0 0 0 0 0 0 3 0 0 0 0 0 3 0 6 0 4 0 0 6\n0 0 3 3 3 3 3 0 0 0 0 0 3 3 6 6 6 0 0 6\n0 0 3 0 0 0 0 0 0 4 0 0 0 3 3 0 6 0 0 6\n0 0 3 3 0 
0 0 0 0 0 0 4 0 3 3 0 6 0 4 6\n0 0 0 3 3 3 3 3 3 3 3 3 3 3 0 0 6 6 0 6\n0 0 0 0 3 3 3 3 3 3 3 0 0 0 0 0 0 6 6 6\n0 0 0 0 3 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 0 4 0 0 0 3 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 0 0 0 0 0 3 0 0 3 3 3 3 3 3 3\n0 0 3 0 0 0 0 0 0 3 3 0 0 3 3 3 2 3 3 3\n0 0 3 0 0 0 0 0 0 3 0 0 0 3 2 3 3 1 3 3\n0 0 3 3 0 4 0 0 0 3 0 0 0 3 3 1 3 3 1 3\n0 0 0 3 3 3 0 0 3 3 0 0 0 3 3 3 1 3 3 3\n0 0 0 0 0 3 3 3 3 0 0 0 0 3 3 3 3 3 3 3\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 5, + 5, + 1, + 5, + 5, + 5, + 0, + 0, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 1, + 5, + 5, + 1, + 5, + 5, + 0, + 0, + 5, + 0, + 5, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 5, + 5, + 1, + 5, + 5, + 2, + 5, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 5, + 0, + 0 + ], + [ + 5, + 5, + 5, + 2, + 5, + 5, + 5, + 0, + 0, + 5, + 0, + 0, + 4, + 5, + 5, + 5, + 5, + 5, + 5, + 0 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 5, + 5, + 5, + 0, + 4, + 5, + 5, + 5, + 5, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 1, + 1, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 4, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 
1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 1, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 1, + 0, + 0, + 4, + 1, + 1, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 2, + 1, + 2, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 5, + 1, + 5, + 1, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 1, + 5, + 1, + 5, + 1, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0 + ], + [ + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 6, + 6, + 6, + 6, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 6, + 2, + 6, + 2, + 6, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 6, + 6, + 6, + 6 + ], + [ + 6, + 1, + 6, + 1, + 6, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 6, + 0, + 4, + 6 + ], + [ + 6, + 1, + 6, + 1, + 6, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 6, + 6, + 6, + 6, + 0, + 6 + ], + [ + 6, + 6, + 6, + 6, + 6, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 3, + 6, + 0, + 4, + 0, + 0, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 0, + 6, + 0, + 0, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 6, + 6, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 6, + 0, + 0, + 6 + ], + [ + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 6, + 6, + 0, + 6 + ], + [ + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], 
+ [ + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 3, + 3, + 3, + 2, + 3, + 3, + 3 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 3, + 2, + 3, + 3, + 1, + 3, + 3 + ], + [ + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 3, + 3, + 1, + 3 + ], + [ + 0, + 0, + 0, + 3, + 3, + 3, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 3, + 1, + 3, + 3, + 3 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_8b7bacbf.json b/problems/arc2_8b7bacbf.json new file mode 100644 index 0000000..dcbc6ba --- /dev/null +++ b/problems/arc2_8b7bacbf.json @@ -0,0 +1,1588 @@ +{ + "problem_id": "arc2_8b7bacbf", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 5 0\n2 0 0 2 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 5 0 0 5 0\n2 0 0 2 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 5 5 1 0\n0 2 2 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 1 0 0 0 1 0\n0 0 0 0 1 1 1 1 1 2 2 1 0 0 0 0 2 0 2 2 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 2 0 0 0 0 2 0 1 0\n0 0 0 0 0 0 1 1 1 1 1 0 0 0 0 0 2 0 0 2 2 0 1 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 2 2 0 0 0 1 0\n0 0 0 1 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 0 0 3 0 0 0 2 2 1 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 0 0 3 0 
0 2 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 1 0 0 1 3 3 1 1 1 2 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 1 1 1 0 0 0 0 0 2 0 0 0 2 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 7\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 7 7 5 0\n2 0 0 2 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 5 7 7 5 0\n2 0 0 2 0 0 0 0 2 0 0 2 0 0 0 0 0 0 0 1 5 5 1 0\n0 2 2 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 1 0 0 0 1 0\n0 0 0 0 1 1 1 1 1 2 2 1 0 0 0 0 2 7 2 2 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 2 7 7 7 7 2 0 1 0\n0 0 0 0 0 0 1 1 1 1 1 0 0 0 0 0 2 7 7 2 2 0 1 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 2 2 0 0 0 1 0\n0 0 0 1 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 7 7 3 0 0 0 2 2 1 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 3 7 7 3 0 0 2 7 7 2 0 0 0 0 0 0 1 0\n0 0 0 1 0 0 1 3 3 1 1 1 2 7 7 2 0 0 0 0 0 0 1 0\n0 0 0 1 1 1 0 0 0 0 0 2 7 7 7 2 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 2 7 7 2 0 0 0 0 0 0 0 1 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 7\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 2 2 0 0\n0 0 0 2 2 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n0 0 2 0 0 2 2 0 0 2 0 0 2 2 0 2 0 0 2 0\n0 0 2 0 0 2 1 2 2 0 0 2 0 0 2 0 2 2 1 0\n0 0 0 2 2 1 1 1 0 0 0 2 0 0 2 0 0 1 0 0\n0 0 0 1 0 0 0 0 1 1 0 0 2 2 0 0 1 0 0 0\n0 0 0 1 0 0 0 0 0 1 1 0 0 0 0 1 0 0 0 0\n0 0 1 1 0 0 0 0 0 0 1 1 0 0 1 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 1 1 1 0 0 0 2 2 0\n1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n4 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 2 2 0 0\n0 0 0 2 2 0 2 4 4 2 0 0 0 0 0 2 4 4 2 0\n0 0 2 4 4 2 2 4 4 2 0 0 2 2 0 2 4 4 2 0\n0 0 2 4 4 2 1 2 2 0 0 2 0 0 2 0 2 2 1 0\n0 0 0 2 2 1 1 1 0 0 0 2 0 0 2 0 0 1 0 0\n0 0 0 1 0 0 0 0 1 1 0 0 2 2 0 0 1 0 0 0\n0 0 0 1 0 0 0 
0 0 1 1 0 0 0 0 1 0 0 0 0\n0 0 1 1 0 0 0 0 0 0 1 1 0 0 1 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 1 1 1 0 0 0 2 2 0\n1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n4 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 2\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2\n0 0 2 2 0 0 0 0 0 0 0 2 2 0 0 0 0 2 0 0\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 2 0 0\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 3 2 2\n0 1 2 2 1 1 1 1 1 1 1 2 2 1 0 0 0 3 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 3 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 3 0\n1 1 0 0 0 0 0 2 2 1 1 1 0 0 0 0 2 2 3 0\n0 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n1 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 0 0 2 0\n0 0 0 0 0 0 1 2 2 0 0 0 0 0 0 3 2 2 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 3 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 3 3 2 2 3 0 0 0 0\n0 0 2 2 1 0 0 0 0 0 3 0 2 0 0 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 3 3 0 2 0 0 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 4 3 0 0 2 2 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2\n0 0 2 2 0 0 0 0 0 0 0 2 2 0 0 0 0 2 4 4\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 2 4 4\n0 2 0 0 2 0 0 0 0 0 2 0 0 2 0 0 0 3 2 2\n0 1 2 2 1 1 1 1 1 1 1 2 2 1 0 0 0 3 0 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 3 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 3 0\n1 1 0 0 0 0 0 2 2 1 1 1 0 0 0 0 2 2 3 0\n0 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 4 4 2 0\n1 1 0 0 0 0 2 0 0 2 0 0 0 0 0 2 4 4 2 0\n0 0 0 0 0 0 1 2 2 0 0 0 0 0 0 3 2 2 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 3 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 3 3 2 2 3 0 0 0 0\n0 0 2 2 1 0 0 0 0 0 3 0 2 4 4 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 3 3 0 2 4 4 2 0 0 0 0\n0 2 0 0 2 0 0 0 3 4 3 0 0 2 2 0 0 0 0 0\n\nTraining Example 4:\nInput:\n0 0 2 2 0 0 0 0\n0 2 0 0 2 0 0 0\n0 2 0 0 2 0 0 0\n0 0 2 2 0 1 0 0\n0 0 0 0 0 0 1 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 0 1 1\n0 0 0 0 0 0 1 4\n\nOutput:\n0 0 2 2 0 0 0 0\n0 2 4 4 2 0 0 0\n0 2 4 4 2 0 0 0\n0 0 2 2 0 1 0 0\n0 0 0 0 0 0 1 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 0 1 1\n0 0 0 0 0 0 1 4\n\nTest Input 1:\n6 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8\n1 1 1 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 3\n5 
5 5 1 9 9 1 1 1 1 1 1 1 9 9 9 9 9 9 9 5 5 5 5 5 5 3 3 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 5 5 3 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 5 3 3 5 5 5\n5 5 5 5 9 9 5 5 5 5 5 5 5 9 9 9 9 9 9 9 1 1 1 1 5 3 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 1 3 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 1 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 5 5 1 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 9 3 5 5 1 5 5\n5 5 5 5 9 9 9 9 9 9 9 5 5 5 5 5 9 3 3 5 5 9 5 5 9 5 5 1 5 5\n5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 9 9 9 3 3 3 9 5 5 9 5 5 1 5 5\n5 5 5 9 5 5 5 5 5 5 5 9 5 5 5 9 5 9 5 5 3 3 9 9 5 5 5 1 1 5\n5 5 3 3 9 9 9 9 9 9 9 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 5 1 5\n5 0 3 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 5 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 1 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 5 1 5 5\n5 5 0 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 1 1 5 5\n5 5 3 5 5 5 5 5 5 5 5 5 5 5 5 9 5 9 5 5 5 5 5 5 5 5 1 5 5 5\n5 5 3 5 5 5 5 5 5 5 5 5 5 3 3 3 9 5 5 5 5 5 5 5 5 1 1 5 5 5\n5 5 3 3 5 5 5 5 5 5 3 3 3 3 5 5 5 5 5 5 9 9 9 1 1 1 5 5 5 5\n5 5 5 3 9 9 3 3 3 3 3 5 5 5 5 5 5 5 5 9 5 5 9 1 1 5 5 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5\n5 5 5 9 5 5 9 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5\n5 5 5 5 9 9 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 5 5 5 9 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 9 9 9 9 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n\nTest Input 2:\n0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 8 8 0\n0 0 0 0 0 0 0 1 1 0 0 0 0 0 1 1 1 0 0 0 0 0 8 0 0 8\n0 0 0 0 2 2 1 1 0 0 0 0 0 0 0 0 1 1 8 8 0 0 8 0 0 8\n0 0 0 2 0 0 2 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 8 8 0\n0 0 0 2 0 0 2 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 0 0 0\n0 0 0 1 2 2 
1 0 0 0 0 0 0 0 0 0 0 0 8 8 1 0 0 0 0 0\n0 0 1 1 0 0 1 1 6 6 6 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 0 8 8 0 0 0 0 0 0 0 1 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 8 0 0 8 0 0 0 5 5 5 1 0\n0 0 1 0 0 0 0 6 0 0 0 6 0 0 8 0 0 8 0 0 5 0 0 0 5 0\n0 0 1 0 0 0 0 0 6 6 6 0 0 9 9 8 8 9 0 0 5 0 0 0 5 0\n0 0 1 0 0 0 0 0 0 0 0 0 9 0 0 0 0 9 9 0 0 5 5 5 0 0\n0 0 1 0 0 0 0 0 8 8 9 9 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 8 0 0 8 0 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 8 0 0 8 0 0 0 0 0 0 0 9 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 0 8 8 0 0 0 0 0 0 0 0 9 0 0 0 8 8 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 9 0 0 8 0 0 8 0\n0 1 1 0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 8 0 0 8 0\n0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 8 0 0 9 8 8 0 0\n0 1 0 0 0 0 0 9 9 9 9 0 0 0 0 9 8 8 9 9 9 0 0 0 0 0\n1 1 0 0 9 9 9 0 0 0 9 9 9 9 9 9 0 0 0 0 0 0 0 0 0 0\n4 1 0 0 9 3 9 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 6, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 8 + ], + [ + 1, + 1, + 1, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3 + ], + [ + 5, + 5, + 5, + 1, + 9, + 9, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 3, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 3, + 3, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 1, + 1, + 1, + 1, + 5, + 3, + 5, + 5, + 5, + 5 + ], + 
[ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 3, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 3, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 9, + 3, + 3, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 9, + 9, + 9, + 3, + 3, + 3, + 9, + 8, + 8, + 9, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 3, + 3, + 9, + 9, + 5, + 5, + 5, + 1, + 1, + 5 + ], + [ + 5, + 5, + 3, + 3, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5 + ], + [ + 5, + 0, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5 + ], + [ + 5, + 5, + 0, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 
5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5, + 5 + ], + [ + 5, + 5, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 3, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 1, + 1, + 5, + 5, + 5 + ], + [ + 5, + 5, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 1, + 1, + 1, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 3, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 9, + 1, + 1, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 9, + 8, + 8, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 6, + 6, + 6, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 9, + 9, + 9, + 9, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ], + [ + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5, + 5 + ] + ], + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, 
+ 0, + 0, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 0, + 0, + 8 + ], + [ + 0, + 0, + 0, + 0, + 2, + 2, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 8 + ], + [ + 0, + 0, + 0, + 2, + 4, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 8, + 8, + 0 + ], + [ + 0, + 0, + 0, + 2, + 4, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 1, + 2, + 2, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 1, + 0, + 0, + 1, + 1, + 6, + 6, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 1, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 0, + 5, + 5, + 5, + 1, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 6, + 4, + 4, + 4, + 6, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 9, + 9, + 8, + 8, + 9, + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 0, + 0, + 5, + 5, + 5, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 9, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 9, + 0, + 0, + 0, + 8, + 8, + 0, + 
0 + ], + [ + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 9, + 0, + 0, + 8, + 3, + 3, + 8, + 0 + ], + [ + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 3, + 3, + 8, + 0 + ], + [ + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 9, + 8, + 8, + 0, + 0 + ], + [ + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 8, + 8, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 0 + ], + [ + 1, + 1, + 0, + 0, + 9, + 9, + 9, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 4, + 1, + 0, + 0, + 9, + 3, + 9, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_8e5c0c38.json b/problems/arc2_8e5c0c38.json new file mode 100644 index 0000000..c7c6601 --- /dev/null +++ b/problems/arc2_8e5c0c38.json @@ -0,0 +1,1068 @@ +{ + "problem_id": "arc2_8e5c0c38", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 1 1 8 8 8 8 8 1 1 8 8 6 6 6 6 8 8 8\n8 8 8 8 8 1 8 8 8 8 8 1 8 8 8 8 6 8 6 8 8 8\n8 8 8 8 1 1 8 1 1 1 8 1 8 8 8 8 6 6 6 8 8 8\n8 8 8 8 1 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 2 2 8 8 
8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 1 1 8 8 8 8 8 1 1 8 8 8 6 6 6 8 8 8\n8 8 8 8 8 1 8 8 8 8 8 1 8 8 8 8 6 8 6 8 8 8\n8 8 8 8 8 1 8 1 1 1 8 1 8 8 8 8 6 6 6 8 8 8\n8 8 8 8 8 1 1 1 8 1 1 1 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 1 8 8 8 1 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 2 2 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 2 8 8 8 2 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 2 2 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 2 2 0 0 2 2 0 0\n0 0 0 0 0 8 8 0 8 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 8 8 0 8 0 0 0 0 0 0 0 2 2 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 4 4 4 0 0 0 4 4 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 
0 0 0 0 0 0 0 0 0 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 2 2 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 2 2 0 0 2 2 0 0\n0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 2 2 2 2 0 0 0\n0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 2 2 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 0 0 0 4 4 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 6 6 6 6 1 6 6 6 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 6 6 1 1 1 1 1 1 6 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 6 1 1 1 1 1 1 6 1 1 1 1 1 1 1 1\n1 1 1 6 6 6 6 1 1 1 6 1 1 6 6 6 1 1 1 1 1 1\n1 1 1 6 6 6 6 1 6 6 6 6 1 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 1 6 6 6 1 1 6 6 6 6 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 6 1 1 1 1 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 6 6 6 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 6 6 1 1 1 1 6 6 6 6 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 6 6 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 6 1 1 1 1 1 1 1 
1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 3 3 1\n1 1 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 3 3 3 3 1\n1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1 3 1 1 1\n1 4 4 4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 4 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTest Input 2:\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 4 4 2 2 2 2 4 4 4 4 4 4 4 4 4 4\n4 4 2 4 4 2 2 2 4 4 2 2 4 4 4 3 3 3 3 3 3 4\n4 4 2 2 4 4 4 4 4 2 2 4 4 4 4 4 3 4 3 4 4 4\n4 4 4 2 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 2 2 2 4 2 2 2 2 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 1 1 4 4 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 4 1 1 1 1 4 1 4 4 4 4\n4 4 4 4 4 4 4 4 1 1 1 4 4 4 4 4 4 1 1 4 4 4\n4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 1 1 1 1 1 1 1 1 1 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 1 1 1 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 
1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 6, + 1, + 1, + 6, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 6, + 6, + 6, + 6, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 6, + 6, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1, + 6, + 6, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 3, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 3, + 1, + 1, + 1 + ], + [ + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 1, + 1, + 1, + 1, + 1, + 1, + 4, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 1 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 4, + 4, + 4, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 4, + 4, + 2, + 2, + 2, + 4, + 4, + 2, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 3, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 2, + 4, + 2, + 2, + 2, + 4, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 2, + 2, + 2, + 4, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 4, + 4, + 1, + 1, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 1, + 1, + 1, + 1, + 4, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_9bbf930d.json b/problems/arc2_9bbf930d.json new file mode 100644 index 0000000..65bb166 --- /dev/null +++ b/problems/arc2_9bbf930d.json @@ -0,0 +1,539 @@ +{ + "problem_id": "arc2_9bbf930d", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n6 7 1 1 1 1 1 1 1 1 1 1 1 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 1 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 4 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 9\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 9 7 9\n6 7 7 8 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 3 3 7 7\n\nOutput:\n6 7 1 1 1 1 1 1 1 1 1 1 1 7 6 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 1 1 1 1 1 1 1 1 1 1 1 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 4 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 7 4\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 9 9\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 
9\n6 7 7 9 9 9 9 9 9 9 9 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 9 7 9\n6 7 7 8 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 3 3 6 7\n\nTraining Example 2:\nInput:\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 5 5 5 5 5 5 5 5 5 5 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 9 9 9 9 9 9 9 9 9 9 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n\nOutput:\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 8 8 8 8 8 8 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 1 1 1 1 1 1 1 1 1 1 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 5 5 5 5 5 5 5 5 5 5 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 0 0 0 0 0 0 0 0 0 0 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 9 9 9 9 9 9 9 9 9 9 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 3 3 3 3 3 3 3 3 3 3 7 7\n\nTraining Example 3:\nInput:\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 7 7 7 7 7 7 7 7 4 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 7 4 7 4 4 4 7 4\n6 7 7 7 7 7 7 4 7 4 7 4 7 4 7 4\n6 7 2 2 2 2 2 2 7 7 7 7 7 4 7 4\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 2 2 2 2 2 2 7 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 5 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 5 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 3 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 3\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 7 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 3 7 3\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 7 7\n\nOutput:\n6 7 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n7 7 7 7 7 7 7 7 7 4 7 7 7 7 7 4\n6 7 4 4 4 4 4 4 7 
4 7 4 4 4 7 4\n6 7 7 7 7 7 7 4 7 4 7 4 7 4 7 4\n6 7 2 2 2 2 2 2 7 7 7 7 7 4 7 4\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 6\n6 7 2 2 2 2 2 2 7 5 7 5 7 9 7 0\n6 7 7 7 7 7 7 7 6 5 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 7 5 7 9 7 0\n7 7 7 7 7 7 7 7 7 7 7 5 7 9 7 0\n6 7 5 5 5 5 5 5 5 5 5 5 7 9 7 0\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 6 7\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 3 3\n7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 3\n6 7 3 3 3 3 3 7 7 7 3 3 3 3 7 3\n6 7 7 7 7 7 7 7 7 7 7 7 7 3 7 3\n6 7 0 0 0 0 0 0 0 0 0 0 0 0 6 7\n\nTest Input:\n6 7 9 9 9 9 9 9 9 7 7 7 7 7 7 7 9 9 9 9 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 9\n6 7 9 9 9 9 9 9 9 7 7 7 7 0 7 0 9 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 0 7 0 7 7 9 7 9\n6 7 0 0 0 0 0 0 0 7 7 7 0 0 7 0 7 7 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 0 7 7 9 7 9\n6 7 0 0 0 0 0 0 0 7 7 7 0 0 0 0 7 7 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 0 7 7 7 7 7 7\n6 7 0 0 0 0 0 0 0 7 7 7 0 7 0 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 8 8 8 8 8 7 1 7 1 7 0 7 0 8 8 8 8 7 7\n6 7 7 7 7 7 7 7 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 1 1 1 1 1 1 1 7 1 7 0 7 0 7 7 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 1 7 0 7 0 0 0 7 7 7 7\n6 7 1 1 1 1 1 1 1 1 1 7 0 7 7 7 7 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 0 0 0 0 0 7 7 7 7\n6 7 4 4 4 4 4 4 4 4 7 7 7 4 4 4 4 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 7 7 7 7 7 7 4 7 7 7 7\n6 7 4 4 4 4 4 4 4 4 2 7 2 4 4 7 4 7 7 7 7\n6 7 7 7 7 7 7 7 7 7 2 7 2 7 4 7 4 7 9 7 9\n6 7 2 2 2 2 2 2 2 2 2 7 2 7 4 7 4 9 9 7 9\n6 7 7 7 7 7 7 7 7 7 7 7 2 7 7 7 7 7 7 7 9\n6 7 2 2 2 2 2 2 2 2 2 2 2 7 7 7 7 9 9 9 9\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 6, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 6, + 7, + 6, + 7, + 7, + 6, + 7, + 9, + 9, + 9, + 9, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 9 + ], + [ + 6, + 7, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 7, + 7, + 7, + 7, + 0, + 7, + 0, + 9, + 9, + 9, + 7, + 9 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 7, + 7, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 7, + 0, + 8, + 8, + 8, + 8, + 7, + 7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 8, + 8, + 8, + 8, + 8, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 8, + 8, + 8, + 8, + 7, + 7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 1, + 7, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 1, + 7, + 0, + 7, + 0, + 0, + 0, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 6 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 4, + 4, + 4, + 4, + 7, + 7, + 7, + 7 + ], + [ 
+ 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 4, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 7, + 2, + 4, + 4, + 7, + 4, + 7, + 7, + 7, + 7 + ], + [ + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 7, + 2, + 7, + 4, + 7, + 4, + 7, + 9, + 7, + 9 + ], + [ + 6, + 7, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 7, + 2, + 7, + 4, + 7, + 4, + 9, + 9, + 7, + 9 + ], + [ + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 2, + 6, + 7, + 7, + 7, + 7, + 7, + 7, + 9 + ], + [ + 6, + 7, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 7, + 7, + 6, + 7, + 9, + 9, + 9, + 9 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_a25697e4.json b/problems/arc2_a25697e4.json new file mode 100644 index 0000000..ffcce91 --- /dev/null +++ b/problems/arc2_a25697e4.json @@ -0,0 +1,1782 @@ +{ + "problem_id": "arc2_a25697e4", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 
1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 4 4 3 3 3 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n4 4 4 4 1 1 1 1 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 3 3 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 2:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 3 3 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 4 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 4 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 
1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n3 3 3 3 1 1 1 1 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 3 3 4 4 4 4 4 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nTraining Example 3:\nInput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 5 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 7 7 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 1 1 1 1 6 1 1 1 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 7 1 1 1 1 6 1 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 1 6 6 6 1 1 1 1 1 1 1 1 1\n\nOutput:\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 
1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 5 5 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 5 5 5 1 1 1 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 7 7 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 6 6 6 1 1 1 1 1 1 1 1 1\n1 1 1 1 1 1 1 1 1 1 1 6 7 6 6 6 1 1 1 1 1 1 1 1 1\n\nTest Input 1:\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 2 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 2 2 4 4 2 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 2 2 2 2 2\n4 4 4 4 4 4 4 4 4 4 4 3 3 3 3 3 1 1 1 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 1 1 1 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 
4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 4 3 3 3 3 3 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 1 3 3 3 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 1 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 8 2 2 2 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 2 8 8 2 2 8 8 8\n8 8 8 8 8 8 8 8 8 4 6 6 8 8 8 8 2 2 8 8 8 2 8 8 8\n8 8 8 8 8 8 4 4 4 4 6 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 6 6 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 7 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 3 3 7 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 3 8 7 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 2, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 2, + 2, + 3, + 3, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 1, + 1, + 1, + 1, + 1, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 1, + 1, + 1, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 4, + 1, + 1, + 1, + 1, + 1 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, 
+ 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 2 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 
4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 2, + 2, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 7, + 2, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 2, + 7, + 7, + 7, + 2, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 6, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 4, + 4, + 4, + 4 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 6, + 4, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 
8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_a32d8b75.json b/problems/arc2_a32d8b75.json new file mode 100644 index 0000000..b927a9b --- /dev/null +++ b/problems/arc2_a32d8b75.json @@ -0,0 +1,1392 @@ +{ + "problem_id": "arc2_a32d8b75", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 6 5 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n0 7 7 7 0 6 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n0 7 7 4 0 6 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n0 7 4 7 0 6 5 5 5 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 3 3 3 3\n0 0 0 0 0 6 5 5 5 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n0 0 0 0 0 6 5 5 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n1 1 1 0 0 6 5 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 1 0 0 6 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3\n0 0 1 0 0 6 5 3 3 3 3 8 8 8 8 8 8 8 1 1 1 8 8 8 8 8 8 8 8 3\n0 1 1 1 0 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 
1 8 8 8 8 8 8 8 8 3\n1 1 1 1 1 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 8 8 8 8 8 8 8 8 3\n1 0 1 0 1 6 5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 8 8 8 8 8 8 8 8 3\n6 6 6 6 6 6 5 3 3 3 8 8 8 8 8 8 8 8 1 1 8 8 8 8 8 8 8 8 8 3\n6 0 0 0 6 6 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n6 0 0 0 6 6 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3\n6 0 0 4 6 6 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3\n6 6 6 6 6 6 5 5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3\n6 0 0 0 6 6 5 5 5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 5\n6 0 7 0 6 6 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n6 0 7 0 6 6 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5 5\n\nOutput:\n5 5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 5 5\n5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n5 5 5 3 3 3 3 3 3 4 4 4 3 3 3 4 4 4 3 3 3 4 4 4\n5 5 5 3 3 3 3 3 3 4 4 7 8 8 8 4 4 7 8 8 3 4 4 7\n5 5 5 3 3 3 3 3 3 4 7 4 8 8 8 4 7 4 8 8 8 4 7 4\n5 5 3 3 3 3 3 8 8 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n5 5 3 3 3 3 8 8 8 4 4 7 4 4 7 4 4 7 4 4 7 4 4 7\n5 5 3 3 3 8 8 8 8 4 7 4 4 7 4 4 7 4 4 7 4 4 7 4\n5 3 3 3 3 8 8 8 8 8 8 8 4 4 4 4 4 4 4 4 4 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 4 4 7 4 4 7 4 4 7 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 4 7 4 4 7 4 4 7 4 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 1 1 1 1 4 4 4 8 8 8 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 8 1 1 8 4 4 7 8 8 8 8 8 3\n5 3 3 3 8 8 8 8 8 8 8 8 8 8 8 4 7 4 8 8 8 8 3 3\n5 3 3 3 3 8 8 8 8 8 8 8 8 8 8 4 4 4 8 8 8 8 3 3\n5 5 3 3 3 8 8 8 8 8 8 8 8 8 8 4 4 7 8 8 8 3 3 3\n5 5 5 3 3 3 8 8 8 8 8 8 8 8 8 4 7 4 8 8 3 3 3 3\n5 5 5 3 3 3 3 8 8 8 8 8 8 8 8 4 4 4 4 4 4 4 4 4\n5 5 5 3 3 3 3 3 3 3 3 3 3 3 3 4 4 7 4 4 7 4 4 7\n5 5 5 5 3 3 3 3 3 3 3 3 3 3 3 4 7 4 4 7 4 4 7 4\n\nTraining Example 2:\nInput:\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 1 1 2 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 1 1 1 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 2 1 2 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 
9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 4 0 4 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 4 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n0 0 0 0 0 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 6 6 6 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 4 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 6 6 6 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 7 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 7 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n6 0 0 0 6 6 8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n\nOutput:\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 1 8 8 9 2 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n2 2 2 8 8 9 2 2 2 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n1 2 1 8 8 9 1 2 1 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 2 2 2 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 1 2 1 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n8 8 8 8 8 9 9 9 9 9 8 8 8 8 8 9 9 9 9 9 8 8 8 8\n\nTraining Example 3:\nInput:\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 3 3 3 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 
5 5 5 5 5 5 5 5\n0 8 3 8 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 8 3 3 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 2 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n0 0 0 0 0 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 6 6 6 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 4 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 0 6 6 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 6 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 7 7 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 0 0 0 6 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nOutput:\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 8 8 8 8 8 8 8 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 3 3 8 3 3 8 3\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 8 3 8 8 3 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 8 8 8 5 5 5 8 8 8\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 3 8 3 5 5 5 3 8 3\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 8 8 4 4 4 3 8 8\n4 4 4 4 4 4 4 4 4 8 8 8 8 8 8 8 8 8 4 4 4 8 8 8\n4 4 4 4 4 4 4 4 4 3 8 3 3 8 3 3 8 3 4 4 4 3 8 3\n4 4 4 4 4 4 4 4 4 3 8 8 3 8 8 3 8 8 4 4 4 3 8 8\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5 5\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 
4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n\nTest Input 1:\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 1 1 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 1 3 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 2 4 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 4 2 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 3 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 3 3\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 3\n0 7 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 3 3 3\n7 7 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 0 3 0\n7 0 0 7 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 3 3 3 3\n7 7 7 7 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 7 0 0 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 7 7 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 0 0 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 7 7 7 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n0 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 0\n6 6 6 6 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 6 6 6 6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 4 0 0 6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 0 0 4 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 6 6 6 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 6 6 6 6\n6 0 7 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 0 0 6\n6 0 7 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 7 0 6\n6 0 0 0 6 9 9 9 9 9 9 9 9 0 0 0 0 9 9 9 9 9 9 9 9 6 0 7 0 6\n\nTest Input 2:\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 
4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 3 3 3 3 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 3 3 3 3 2 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 2 2 2 2 2 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 4 4 4 4 4 0 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 4 4 0 0 4 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 4 0 0 0 4 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 4 4 4 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n0 0 0 0 0 0 0 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4\n6 6 6 6 6 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 4 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 6 6 6 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 7 7 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n6 6 0 0 0 6 6 6 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 4, + 2, + 4, + 2, + 4, + 2, + 
4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 4, + 2, + 9, + 9, + 4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 2, + 4, + 9, + 9, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 2, + 4, + 2, + 4, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 4, + 2, + 4, + 2, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 2, + 4, + 2, + 4, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 4, + 2, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 2, + 4, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 1, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 0, + 0, + 0, + 0 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 3, + 1, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 3, + 9, + 9, + 9, + 
9, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 9, + 9, + 9, + 9, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 3, + 1, + 3, + 1, + 3, + 1, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 9, + 9, + 9, + 9 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 3, + 1, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 9, + 9, + 9, + 9, + 3, + 1 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 9, + 0, + 0, + 0, + 0, + 9, + 9, + 3, + 1, + 3, + 1, + 3, + 1 + ] + ], + [ + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, 
+ 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 2, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 2, + 2, + 2, + 2, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 2, + 2, + 2, + 2, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 2, + 2, + 2, + 2, + 3, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 4, + 4, + 4, + 4, + 4, + 3, + 3, + 3, + 3, + 3, + 4, + 4 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 4, + 4, + 4, + 4, + 4, + 3, + 2, + 2, + 2, + 2, + 4, + 4 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1, + 1, + 
1, + 1, + 2, + 2, + 2, + 2, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1, + 1, + 1, + 1, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ], + [ + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 2, + 2, + 2, + 2, + 3, + 1, + 1 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 1, + 1 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_abc82100.json b/problems/arc2_abc82100.json new file mode 100644 index 0000000..3f83cd2 --- /dev/null +++ b/problems/arc2_abc82100.json @@ -0,0 +1,450 @@ +{ + "problem_id": "arc2_abc82100", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n1 2 8 8 8\n0 0 0 0 1\n0 0 0 1 0\n0 0 0 1 0\n0 0 0 0 1\n\nOutput:\n0 0 0 0 0\n0 0 0 0 2\n0 0 0 2 2\n0 0 0 2 2\n0 0 0 0 2\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 6 0 6 0 6 0 6 0 6 0 6 0 6 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n0 2 0 8 0 8 0 0 0 0 0 0 0 4 0\n0 0 0 0 7 0 0 0 0 0 0 0 0 0 0\n0 8 0 0 6 0 0 8 0 0 0 0 0 0 0\n8 0 4 2 0 4 2 0 8 0 0 0 0 0 0\n0 8 0 0 7 0 0 8 0 0 0 0 0 2 0\n0 0 0 0 6 0 0 0 0 0 0 0 0 0 0\n0 7 0 8 0 8 0 7 0 7 0 7 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 7 0 7 0 7 0 7 0 7 0 7 0 7 0\n7 0 7 0 7 0 7 0 7 0 7 0 7 0 7\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n4 0 0 0 
0 0 0 0 0 0 0 0 0 0 2\n0 4 0 0 0 0 0 0 0 0 0 0 0 2 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0\n0 0 0 0 0 0 0 0 0 0 0 0 4 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0\n6 0 6 0 0 0 6 0 6 0 6 0 6 0 0\n0 6 0 0 0 0 0 6 0 6 0 6 0 0 0\n\nTraining Example 3:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 4 0 0 0 0 0 0 0 0 0 0 0 4 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 0 0 0 0 0 0 8 0 0 0 4 0 0 0 4 0 0\n0 0 0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0\n0 0 0 4 0 0 0 8 0 0 0 8 0 0 0 4 0 0 0 0\n0 0 0 0 0 0 8 0 0 0 0 0 8 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 8 0 0 0 8 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 8 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 7 0 0 0 0 0\n1 0 0 0 1 0 0 0 0 0 0 0 8 0 0 0 8 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 0 0 0 0\n0 0 1 0 0 0 0 0 0 0 0 0 0 0 8 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 8 0 0 0 8 0 0 0\n\nOutput:\n0 2 0 2 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0 2\n0 0 2 0 2 0 0 0 0 0 2 0 0 0 2 0 2 0 0 0\n0 2 0 2 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0 2\n2 0 2 0 0 0 2 0 0 0 0 0 2 0 2 0 2 0 2 0\n0 2 0 0 0 2 0 0 0 0 0 0 0 2 0 0 0 2 0 0\n0 0 2 0 2 0 0 0 0 0 0 0 0 0 2 0 2 0 0 0\n0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 7 0 7 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 7 0 0 0 7 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 4:\nInput:\n1 1 1 1 1 2 0 0\n0 0 0 0 0 2 0 0\n0 0 0 0 0 2 
0 0\n0 2 1 8 0 2 0 0\n0 0 0 0 0 2 0 0\n0 0 8 0 0 2 0 0\n0 0 2 0 0 2 0 0\n0 0 1 0 0 2 0 0\n\nOutput:\n2 2 2 2 2 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n0 0 0 0 0 1 0 0\n\nTest Input:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 6 0 0\n2 0 0 8 0 0 0 6 0 0 0 0 0 0 0 0 0 0 0 6\n0 4 1 8 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0\n0 0 0 8 0 0 0 0 0 0 0 0 0 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 4 0 0\n0 2 4 8 0 8 0 0 0 0 0 2 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 5 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0\n0 5 7 8 8 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 0 0 0 2 0 0 0 0 0 0 0 2 0 0 0 0 0 6\n0 0 0 0 0 0 0 0 0 4 0 0 0 0 0 0 0 0 0 0\n0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 4 0 0 6 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n5 0 0 0 0 0 0 0 0 6 0 0 0 0 0 0 0 0 0 0\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 0, + 0 + ], + [ + 4, + 0, + 4, + 0, + 0, + 0, + 0, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6 + ], + [ + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 7, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 4, + 0, + 0 + ], + [ + 0, + 4, + 0, + 4, + 0, + 4, + 0, + 4, + 0, + 1, + 0, + 0, + 0, + 4, + 0, + 4, + 0, + 0, + 0, + 6 + ], + [ + 0, + 0, + 4, + 7, + 0, + 0, + 4, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 6, 
+ 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_d35bdbdc.json b/problems/arc2_d35bdbdc.json new file mode 100644 index 0000000..1643fb3 --- /dev/null +++ b/problems/arc2_d35bdbdc.json @@ -0,0 +1,374 @@ +{ + "problem_id": "arc2_d35bdbdc", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 3 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 3 3 3\n0 0 5 5 5 5 5 3 4 3\n0 5 0 0 0 0 0 3 3 3\n0 5 4 4 4 0 0 0 0 0\n5 0 4 2 4 0 0 6 6 6\n0 5 4 4 4 0 5 6 1 6\n0 5 5 5 5 5 0 6 6 6\n0 0 1 1 1 0 0 0 0 0\n0 0 1 3 1 0 0 0 0 0\n0 0 1 1 1 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 3 3 3\n0 0 5 5 5 5 5 3 2 3\n0 5 0 0 0 0 0 3 3 3\n0 5 0 0 0 0 0 0 0 0\n5 0 0 0 0 0 0 6 6 6\n0 5 0 0 0 0 5 6 3 6\n0 5 5 5 5 5 0 6 6 6\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n2 2 2 0 0 0 3 3 3 0\n2 6 2 0 0 0 3 2 3 0\n2 2 2 0 5 0 3 3 3 0\n0 0 0 5 0 5 5 5 5 0\n8 8 8 0 5 0 0 1 1 1\n8 3 8 0 0 5 0 1 4 1\n8 8 8 0 5 0 0 1 1 1\n0 5 0 5 4 4 4 0 0 0\n0 5 5 0 4 8 4 0 0 0\n0 0 0 0 4 4 4 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 0 0 0 0 0\n0 0 0 5 0 5 5 5 5 0\n8 8 8 0 5 0 0 1 1 1\n8 2 8 0 0 5 0 1 8 1\n8 8 8 0 5 0 0 1 1 1\n0 5 0 5 0 0 0 0 0 0\n0 5 5 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n1 1 1 0 0 0 0 4 4 4\n1 2 1 0 0 0 0 4 3 4\n1 1 1 0 0 5 0 4 4 4\n0 5 0 0 5 0 5 0 0 0\n0 5 0 5 3 3 3 5 0 0\n0 0 5 0 3 6 3 0 5 0\n0 0 0 0 3 3 3 0 5 0\n2 2 2 0 0 0 0 7 7 7\n2 9 2 0 0 0 0 7 4 7\n2 2 2 0 0 0 0 7 7 7\n\nOutput:\n1 1 1 0 0 0 0 0 0 0\n1 9 1 0 0 0 0 0 0 0\n1 1 1 0 0 5 0 0 0 0\n0 5 0 0 5 0 5 0 0 0\n0 5 0 5 0 0 0 5 0 0\n0 0 5 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 0 5 0\n0 0 0 0 0 0 0 7 7 7\n0 0 0 0 0 0 0 7 3 7\n0 0 0 0 0 0 0 
7 7 7\n\nTest Input 1:\n0 0 0 0 0 0 0 2 0 0\n0 0 4 0 0 0 2 3 2 0\n0 4 2 4 0 0 0 2 0 0\n0 0 4 0 0 0 0 5 0 0\n0 0 0 0 0 0 5 0 0 0\n0 0 0 0 1 0 5 0 3 0\n0 7 0 1 9 1 5 3 3 3\n7 1 7 0 1 0 5 0 3 0\n0 7 0 5 0 5 0 0 0 0\n0 5 5 0 5 0 0 0 0 0\n\nTest Input 2:\n0 0 0 4 4 4 0 2 2 2\n0 0 5 4 2 4 5 2 3 2\n0 0 5 4 4 4 5 2 2 2\n0 0 0 5 0 0 5 5 5 5\n0 0 5 1 1 1 0 0 0 5\n0 5 0 1 3 1 5 5 5 0\n0 0 5 1 1 1 5 3 3 3\n6 6 6 5 0 0 5 3 6 3\n6 9 6 5 5 5 5 3 3 3\n6 6 6 0 0 0 0 0 0 0\n\nTest Input 3:\n0 0 0 1 1 1 0 6 6 6\n0 0 0 1 3 1 0 6 1 6\n0 0 0 1 1 1 0 6 6 6\n5 5 5 5 5 0 0 0 5 0\n5 2 2 2 5 0 0 0 5 0\n5 2 4 2 5 3 3 3 5 0\n5 2 2 2 5 3 9 3 0 5\n0 5 5 0 5 3 3 3 0 5\n0 7 7 7 0 5 5 0 0 5\n0 7 2 7 0 0 0 5 5 0\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 3, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 7, + 9, + 7, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 5, + 0, + 5, + 0, + 0, + 0, + 0 + ], + [ + 0, + 5, + 5, + 0, + 5, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 2, + 2, + 2 + ], + [ + 0, + 0, + 5, + 4, + 3, + 4, + 5, + 2, + 6, + 2 + ], + [ + 0, + 0, + 5, + 4, + 4, + 4, + 5, + 2, + 2, + 2 + ], + [ + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 5, + 5, + 5 + ], + [ + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 5, + 0, + 0, + 0, + 0, + 5, + 5, + 5, + 0 + ], + [ + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 5, + 0, + 0, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 5, + 5, + 5, + 5, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 
0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 3, + 6 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6 + ], + [ + 5, + 5, + 5, + 5, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 5, + 0 + ], + [ + 5, + 0, + 0, + 0, + 5, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 5, + 5, + 0, + 5, + 0, + 0, + 0, + 0, + 5 + ], + [ + 0, + 7, + 7, + 7, + 0, + 5, + 5, + 0, + 0, + 5 + ], + [ + 0, + 7, + 4, + 7, + 0, + 0, + 0, + 5, + 5, + 0 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_d8e07eb2.json b/problems/arc2_d8e07eb2.json new file mode 100644 index 0000000..fdeab35 --- /dev/null +++ b/problems/arc2_d8e07eb2.json @@ -0,0 +1,1452 @@ +{ + "problem_id": "arc2_d8e07eb2", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 1 1 1 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 8 1 8 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 1 1 1 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 0 0 0 3 3 1 1 1 3 3 7 3 3 3 3 3 6 6 3 3\n3 3 0 0 0 3 3 3 1 3 3 3 7 7 7 3 3 3 3 6 3 3\n3 3 0 0 0 3 3 1 1 1 3 3 7 3 3 3 3 3 6 6 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 8\n8 3 7 3 3 3 3 1 1 1 3 3 3 6 6 3 3 0 0 0 3 8\n8 3 7 7 7 3 3 3 1 3 3 3 3 3 6 3 3 0 0 0 3 8\n8 3 7 3 3 3 3 1 1 1 3 3 3 6 6 3 3 0 0 0 3 8\n8 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 8 8 8 8 1 1 1 8 8 6 6 6 8 8 2 2 8 8 8\n8 8 0 0 0 8 8 8 1 8 8 8 6 8 6 8 8 2 2 2 8 8\n8 8 0 8 0 8 8 1 1 1 8 8 6 8 6 8 8 8 2 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 
6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 0 3 3 3 3 1 1 1 3 3 6 6 6 3 3 2 2 3 3 3\n3 3 0 0 0 3 3 3 1 3 3 3 6 3 6 3 3 2 2 2 3 3\n3 3 0 3 0 3 3 1 1 1 3 3 6 3 6 3 3 3 2 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 3 0 3 3 3 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 3 0 0 0 3 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 3 0 3 0 3 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 3 3 1 3 3 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 3 2 2 
2 3 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 3 6 6 6 3 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 3 6 3 6 3 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 3 6 3 6 3 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3\n\nTraining Example 3:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 4 8 4 8 8 2 2 8 8 8 2 2 2 8 8\n8 8 8 2 8 8 8 4 8 4 8 8 2 2 2 8 8 2 8 2 8 8\n8 8 2 8 2 8 8 4 4 4 8 8 8 2 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 4 8 4 8 8 2 2 8 8 8 2 2 2 8 8\n8 8 8 2 8 8 8 4 8 4 8 8 2 2 2 8 8 2 8 2 
8 8\n8 8 2 8 2 8 8 4 4 4 8 8 8 2 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 2 3 2 3 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 3 3 2 3 3 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 3 2 3 2 3 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 3 4 3 4 3 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 3 4 3 4 3 3 2 2 2 3 8 5 8 8 8 8 1 1 8 8 8\n8 3 4 4 4 3 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 3 3 3 3 3 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 3 2 2 2 3 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 3 2 3 2 3 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 3 2 2 2 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTraining Example 4:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 2 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 2 2 2 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 8 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 2 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 0 0 0 8 8 2 2 2 8 8 7 7 7 8 8 8 8 6 8 8\n8 8 0 0 0 8 8 8 2 8 8 8 7 8 8 8 8 8 6 6 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 3 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3 8\n8 3 7 3 3 3 8 1 1 1 8 3 3 6 6 3 3 0 0 0 3 8\n8 3 7 7 7 3 8 8 1 8 8 3 3 3 6 3 3 0 0 0 3 8\n8 3 7 3 3 3 8 1 1 1 8 3 3 6 6 3 3 0 0 0 3 8\n8 3 3 3 3 3 8 8 8 8 8 3 3 3 3 3 3 3 3 3 3 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 3 2 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 3 2 2 2 3 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 3 3 2 3 3 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTraining Example 5:\nInput:\n8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 8 9 8 8 8 8 8 8 8\n8 8 8 1 8 8 8 1 1 8 8 8 9 9 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 9 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 8 9 8 8 8 8 8 8 8\n8 8 8 1 8 8 8 1 1 8 8 8 9 9 8 8 8 8 8 8 8 8\n8 8 1 1 1 8 8 1 8 1 8 8 9 9 9 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 3 9 3 9 3 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 3 9 9 3 3 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 3 9 9 9 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 3 
3 1 3 3 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 3 1 1 1 3 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 3 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 3 1 3 1 3 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 3 1 1 3 3 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 3 1 3 1 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 3 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n\nTest Input 1:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 0 0 0 8 8 1 8 1 8 8 9 8 9 8 8 2 2 2 8 8\n8 8 0 0 0 8 8 1 1 8 8 8 9 9 8 8 8 2 8 2 8 8\n8 8 0 0 0 8 8 1 8 1 8 8 9 9 9 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 7 8 8 8 8 2 2 8 8 8 5 5 8 8 8\n8 8 8 2 8 8 8 7 7 7 8 8 2 2 2 8 8 5 8 8 8 8\n8 8 2 8 2 8 8 7 8 8 8 8 8 2 8 8 8 5 5 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 2 8 2 8 8 0 8 8 8 8 8 8 7 8 8 9 8 9 8 8\n8 8 8 2 8 8 8 0 0 0 8 8 8 8 7 8 8 9 9 8 8 8\n8 8 2 8 2 8 8 0 8 0 8 8 7 7 7 8 8 9 9 9 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 7 7 7 8 8 8 1 8 8 8 8 8 6 8 8 0 0 0 8 8\n8 8 7 8 8 8 8 1 1 1 8 8 8 6 6 8 8 0 0 0 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 4 8 4 8 8 2 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 4 8 4 8 8 2 2 2 8 8 5 8 8 8 8 1 1 8 8 8\n8 8 4 4 4 8 8 8 2 8 8 8 5 5 8 8 8 1 8 1 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 9 8 8 8 8 6 6 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 9 9 9 8 8 6 8 6 8 8 4 4 4 8 8 2 8 2 8 8\n8 8 8 8 9 8 8 6 8 6 8 8 8 4 8 8 8 2 2 2 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6 6\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 3, + 1, + 3, + 3, + 9, + 3, + 9, + 3, + 3, + 2, + 2, + 2, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, + 1, + 3, + 3, + 3, + 9, + 9, + 3, + 3, + 3, + 2, + 3, + 2, + 3, + 3 + ], + [ + 3, + 3, + 0, + 0, + 0, + 3, + 3, + 1, 
+ 3, + 1, + 3, + 3, + 9, + 9, + 9, + 3, + 3, + 2, + 2, + 2, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 9, + 3, + 9, + 3, + 8 + ], + [ + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 7, + 8, + 3, + 9, + 9, + 3, + 3, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 0, + 8, + 0, + 8, + 8, + 7, + 7, + 7, + 8, + 3, + 9, + 9, + 9, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 3, + 0, + 0, + 0, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 8, + 2, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 3, + 1, + 3, + 1, + 3, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 8, + 2, + 2, + 2, + 8, + 8, + 5, + 8, + 8, + 8, + 3, + 1, + 1, + 3, + 3, + 8 + ], + [ + 8, + 8, + 4, + 4, + 4, + 8, + 
8, + 8, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 3, + 1, + 3, + 1, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 6, + 6, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 3, + 2, + 2, + 2, + 3, + 8 + ], + [ + 8, + 8, + 9, + 9, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 4, + 4, + 4, + 8, + 3, + 2, + 3, + 2, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 3, + 2, + 2, + 2, + 3, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ], + [ + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 2, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 2, + 2, + 2, + 8, + 8, + 5, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 2, + 8, + 2, + 8, + 8, + 7, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 5, + 5, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 3, + 
3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 2, + 3, + 2, + 3, + 8, + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 9, + 8, + 9, + 8, + 8 + ], + [ + 8, + 3, + 3, + 2, + 3, + 3, + 8, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 9, + 9, + 8, + 8, + 8 + ], + [ + 8, + 3, + 2, + 3, + 2, + 3, + 8, + 0, + 8, + 0, + 8, + 8, + 7, + 7, + 7, + 8, + 8, + 9, + 9, + 9, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 3, + 7, + 3, + 3, + 3, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 7, + 7, + 7, + 3, + 8, + 8, + 1, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 7, + 3, + 3, + 3, + 8, + 1, + 1, + 1, + 8, + 8, + 8, + 6, + 6, + 8, + 8, + 0, + 0, + 0, + 8, + 8 + ], + [ + 8, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 3, + 2, + 2, + 3, + 3, + 3, + 5, + 5, + 3, + 3, + 8, + 1, + 8, + 1, + 8, + 8 + ], + [ + 8, + 8, + 4, + 8, + 4, + 8, + 3, + 2, + 2, + 2, + 3, + 3, + 5, + 3, + 3, + 3, + 8, + 1, + 1, + 8, + 8, + 8 + ], + [ + 8, + 8, + 4, + 4, + 4, + 8, + 3, + 3, + 2, + 3, + 3, + 3, + 5, + 5, + 3, + 3, + 8, + 1, + 8, + 1, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 6, + 6, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 2, + 2, + 2, + 8, + 8 + ], + [ + 8, + 8, 
+ 9, + 9, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 4, + 4, + 4, + 8, + 8, + 2, + 8, + 2, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 6, + 8, + 6, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 2, + 2, + 2, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6, + 6 + ], + [ + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ], + [ + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 2 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_e12f9a14.json b/problems/arc2_e12f9a14.json new file mode 100644 index 0000000..44e331d --- /dev/null +++ b/problems/arc2_e12f9a14.json @@ -0,0 +1,1932 @@ +{ + "problem_id": "arc2_e12f9a14", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 3 3 8 8 8 8 8 8 3 3 8 8 8 3 8 3 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 8 3 3 8 8 8 8 8 8 3 3 8 8 8 3 8 3 3 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 6 6 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 8 1 4 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n9 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 9 8 8 8 8 8 8 9 1 8 8 8 8 8 8 1 8 4 8 8 8 8 8\n8 8 9 8 8 8 8 9 8 8 1 8 8 8 8 1 8 8 4 8 8 8 8 8\n8 8 8 9 3 3 9 8 8 8 8 1 3 3 1 8 8 3 4 3 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 3 9 9 3 8 8 8 8 3 1 1 3 8 8 3 4 4 3 8 8 8\n8 8 8 9 3 3 9 8 8 8 8 1 3 3 1 8 8 3 4 3 3 8 8 8\n8 8 9 8 8 8 8 9 8 8 1 8 8 8 8 1 8 8 4 8 8 8 8 8\n8 9 8 8 8 8 8 8 9 1 8 8 8 8 8 8 1 8 4 8 8 8 8 8\n9 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 1 4 8 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 8 8 8 8 8 8 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8 8\n8 3 3 3 3 8 8 8 9 1 8 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 3 6 6 6 6 6 6 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8 8\n8 3 6 6 3 8 8 8 6 8 9 1 8 8 8 8 8 8 8 8 1 4 8 8\n8 3 3 3 3 8 8 8 8 6 8 9 1 8 8 8 8 8 8 8 1 4 8 8\n8 8 8 8 8 8 8 8 8 8 6 8 9 1 8 8 8 8 8 8 8 1 4 8\n\nTraining Example 2:\nInput:\n8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n8 3 3 8 3 8 8 8\n8 3 4 4 3 8 8 8\n8 3 4 4 8 8 8 8\n8 8 3 3 3 8 8 8\n8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 4 8 8 8 8\n8 8 8 4 8 8 8 8\n8 3 3 4 3 8 8 8\n8 3 4 4 3 8 8 8\n8 3 4 4 4 4 4 4\n8 4 3 3 3 8 8 8\n4 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8\n\nTraining Example 3:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 2 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 2 2 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 8 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 2 8 4 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 2 8 4 8 8 8 8\n8 8 8 3 2 2 2 2 2 2 2 2 2 8 4 8 8 8 8 8\n2 2 2 2 2 2 3 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 3 3 3 3 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 4 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 4 3 8 8 8 8 8\n4 4 4 4 4 4 4 4 4 4 4 4 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 3 3 3 8 8 8 8 8 8 8 8 8 8 8\n7 7 7 7 7 7 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 3 7 7 3 8 8 8 8 8 8 8 8 8 8 8\n\nTraining Example 4:\nInput:\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 3 8 3 8 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 8 3 3 3 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nOutput:\n8 8 6 8 8 8 6 8 8 8 8 8\n8 8 6 8 8 6 8 8 8 8 8 8\n8 3 6 3 6 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 3 6 6 3 8 8 8 8 8 8 8\n8 6 3 3 3 8 8 8 8 8 8 8\n6 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 
8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8\n\nTest Input 1:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 2 2 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 2 2 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 8 0 0 0 0 0\n0 0 0 0 0 8 8 0 0 0 0 8 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 3 3 8 0 0 8 4 4 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 3 3 8 0 0 8 4 4 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 8 0 8 0 0 0 0 8 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 8 8 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 7 7 8 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 7 7 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 8 0 8 8 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 2:\n8 8 8 8 8 8 8 8 8 8 8 
8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 8 3 3 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 2 2 3 8 8 8 8 8 8 8 3 4 4 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 2 2 3 8 8 8 8 8 8 8 3 4 4 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 3 3 3 8 8 8 8 8 8 8 8 3 8 3 3 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 8 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 6 6 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 6 6 3 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 7 7 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 7 7 3 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 3 3 3 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 3 8 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 9 9 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 9 9 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n3 3 3 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8 8\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 
0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 2, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 2, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 0 + ], + [ + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 2, + 8, + 8, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 8, + 2, + 2, + 8, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 2, + 2, + 8, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 3, + 0, + 0, + 0, + 0, + 3, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 3, + 8, + 8, + 3, + 0, + 0, + 4, + 8, + 8, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 3, + 3, + 8, + 0, + 0, + 8, + 4, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, 
+ 0, + 0, + 2, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 3, + 8, + 3, + 0, + 0, + 4, + 8, + 4, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 7, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, 
+ 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 7, + 8, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 7, + 8, + 8, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 3, + 0, + 0, + 3, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6 + ], + [ + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8 + ], + [ + 2, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8 + ], + [ + 8, + 2, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8, + 8 + ], + [ + 9, + 8, + 2, + 3, + 2, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 3, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 9, + 8, + 2, + 2, + 2, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 8, + 6, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 2, + 2, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 4, + 3, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 3, + 3, + 3, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 4, + 3, + 3, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 
9, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 8, + 6 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 8, + 6, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8, + 6, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 3, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 8, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 6, + 3, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 6, + 6, + 3, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 3, + 3, + 3, + 6, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 6, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 3, + 3, + 3, + 3, + 8, + 8, + 8, + 6, + 6 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 3, + 7, 
+ 7, + 7, + 7, + 7, + 7, + 7, + 7 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 3, + 7, + 7, + 3, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 3, + 3, + 3, + 7, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 8, + 8 + ], + [ + 3, + 3, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8, + 8 + ], + [ + 3, + 9, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8, + 8 + ], + [ + 3, + 9, + 9, + 3, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7, + 8 + ], + [ + 3, + 3, + 3, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 7 + ], + [ + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ], + [ + 8, + 8, + 8, + 8, + 8, + 9, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 2, + 4, + 8, + 8, + 8, + 8, + 8, + 8, + 8 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_e3721c99.json b/problems/arc2_e3721c99.json new file mode 100644 index 0000000..4e01d14 --- /dev/null +++ b/problems/arc2_e3721c99.json @@ -0,0 +1,1932 @@ +{ + "problem_id": "arc2_e3721c99", + "problem_text": "ARC Puzzle: Predict the output grid for each of the 2 test inputs.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 
0\n0 4 4 4 0 3 0 3 0 1 0 1 0 1 0 2 0 2 0 2 0 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 0 5 5 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 5 5 0 0 0 0 0 5 5 0 0 0 5 5 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 5 5 0 0 0 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 5 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0 0\n0 0 0 5 5 5 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 5 5 5 0 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 0 5 0 5 0 0 0 0 5 5 5 5 0 0 5 0 0\n0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 5 5 5 0 0 0 5 5 0 5 5 5 5 0 0\n0 0 0 0 0 5 5 5 0 5 0 0 5 0 5 5 5 0 0 0 0 5 5 0 0 5 5 5 0 0\n0 0 0 5 5 5 5 5 0 5 0 0 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0\n0 0 5 5 5 5 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 0 5 5 5 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0\n0 0 5 5 5 5 5 5 5 5 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0\n0 0 5 5 0 5 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0\n0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 0 3 0 1 0 1 0 1 0 2 0 2 0 2 0 2 0 0 0 0 0 0 0 0\n0 4 4 4 0 3 3 3 0 1 1 1 1 1 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 3 3 0 4 4 4 4 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 3 3 0 3 3 0 4 4 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 4 4 0 0 0 0 0 1 1 0 0 0 1 1 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 4 4 4 0 0 0 1 1 0 0 0 1 1 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 4 4 4 4 0 0 0 0 1 1 1 1 1 1 1 0 0 0 0 0 0\n0 0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 3 3 3 3 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 1 1 1 1 0 0\n0 0 0 3 3 3 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 1 1 1 0 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 0 2 0 2 0 0 0 0 1 1 1 1 0 0 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 2 0 0 0 1 1 0 1 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 0 2 2 2 0 0 0 0 1 1 0 0 1 1 1 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 0 0 1 1 1 1 1 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 4 4 4 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 4 4 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 0 3 0 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 5 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 0 0 0 0 5 5 5 5 5 5 5 5 5 5 0 
0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 5 5 5 5 5 5 5 5 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 5 5 5 0 0 5 5 5 0 0\n0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 5 5 5 5 0\n0 0 5 5 5 5 5 5 5 0 0 0 5 5 5 5 0 0 0 0 5 5 5 5 5 5 5 5 0 0\n0 5 5 5 5 5 5 5 5 0 0 0 5 5 5 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0\n0 0 5 5 5 5 5 5 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 5 5 0 5 5 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 5 0 0 5 5 0 0 0 0 0\n0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 0\n0 0 0 0 5 0 0 5 5 0 0 0 5 0 0 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 0 0 5 5 0 0 5 0 0 0 5 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 0 0 0\n0 0 0 5 5 0 5 5 0 0 0 5 0 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 5 5 5 5 0 0 0 5 0 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 5 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 3 0 3 0 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 2 2 2 0 3 3 3 0 1 0 0 0 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 2 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0\n1 1 1 1 1 1 1 1 1 1 0 0 0 0 2 2 2 2 2 2 2 2 2 2 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 3 0 0\n0 0 0 0 0 0 0 0 0 0 2 2 2 
0 0 0 0 0 0 0 3 3 3 3 3 3 3 3 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 0 0 0 0 0 0 0 3 3 3 0 0 3 3 3 0 0\n0 0 0 0 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 3 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 3 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 3 3 0 0 0 3 3 3 3 0\n0 0 2 2 2 2 2 2 2 0 0 0 2 2 2 2 0 0 0 0 3 3 3 3 3 3 3 3 0 0\n0 2 2 2 2 2 2 2 2 0 0 0 2 2 2 0 0 0 0 0 0 3 3 0 0 0 0 0 0 0\n0 0 2 2 2 2 2 2 0 0 0 0 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 2 2 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 2 2 2 2 0 0 0 0 0 3 3 3 3 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 3 3 0 3 3 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 2 2 2 0 0 0 0 0 3 0 0 3 3 0 0 0 0 0\n0 0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 3 0 0 3 0 0 0 0 0 0\n0 0 0 0 3 0 0 3 3 0 0 0 0 0 0 0 0 0 0 0 3 3 3 3 3 0 0 0 0 0\n0 0 0 3 3 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 3 3 3 3 0 0 0 0 0 0\n0 0 0 3 3 0 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 3 3 3 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n\nTest Input 1:\n0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0\n0 0 5 5 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 1 0 8 8 8 0\n0 5 5 5 5 5 5 5 0 5 5 5 0 0 5 5 5 5 5 0 0 0 0 0 1 0 8 0 8 0\n0 5 0 5 5 0 0 5 0 0 0 0 0 5 5 0 0 0 5 0 0 0 0 0 1 0 8 8 8 0\n0 5 0 0 5 0 0 5 0 0 0 0 0 5 0 0 0 0 5 0 5 5 5 0 1 0 8 0 8 0\n0 5 5 5 5 0 0 5 0 0 0 0 0 5 5 0 0 5 5 0 5 0 5 0 1 0 8 8 8 0\n0 0 5 5 5 0 5 5 0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 0 1 0 0 0 0 0\n0 0 0 0 5 5 5 0 0 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 1 0 6 6 6 0\n5 5 0 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 1 0 6 0 6 0\n5 5 0 0 0 0 0 0 0 5 5 5 5 0 0 0 5 5 5 5 5 5 0 0 1 0 6 6 6 0\n5 5 5 0 0 0 0 0 0 0 5 5 0 0 5 5 5 0 0 5 5 5 5 0 1 0 6 0 6 0\n5 5 5 0 0 5 5 5 0 0 0 0 0 5 5 5 5 0 5 5 0 0 5 0 1 0 6 6 
6 0\n5 5 5 0 5 5 0 5 5 5 5 0 0 5 0 0 5 5 5 0 0 0 5 0 1 0 6 0 6 0\n5 5 0 0 5 0 0 0 5 0 5 0 0 5 0 0 0 5 5 5 0 0 5 0 1 0 6 6 6 0\n0 0 0 0 5 5 0 0 5 5 5 0 0 5 5 0 0 5 0 5 5 5 5 0 1 0 6 0 6 0\n0 0 0 0 0 5 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 5 5 0 1 0 6 6 6 0\n0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 5 0 5 0 0 1 0 0 0 0 0\n0 0 5 5 0 0 0 0 0 0 0 5 5 0 0 0 0 0 0 5 5 5 0 0 1 0 4 4 4 0\n0 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 4 0 4 0\n5 5 5 5 5 5 5 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 1 0 4 4 4 0\n0 5 5 5 5 5 5 0 0 5 5 5 5 0 0 0 5 5 5 5 0 0 0 0 1 0 4 0 4 0\n0 0 0 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 5 5 5 5 0 0 1 0 4 4 4 0\n0 0 0 0 0 0 0 0 5 5 0 0 5 0 0 0 0 5 5 0 5 5 0 0 1 0 4 0 4 0\n0 5 5 0 0 0 0 5 5 0 0 0 5 0 0 0 5 5 0 0 5 0 0 0 1 0 4 4 4 0\n0 5 5 5 0 0 5 5 5 0 0 0 5 0 0 5 5 0 0 0 5 0 0 0 1 0 4 0 4 0\n0 5 5 5 0 5 5 0 5 5 5 5 5 5 5 5 0 0 0 0 5 0 0 0 1 0 4 4 4 0\n0 5 5 0 0 5 0 0 0 5 5 5 0 5 5 0 0 0 0 0 5 0 0 0 1 0 4 0 4 0\n0 0 0 0 0 5 0 0 0 0 5 0 0 0 5 0 0 0 0 5 5 0 0 0 1 0 4 4 4 0\n0 0 0 0 0 5 5 0 0 0 5 0 0 0 5 0 0 0 5 5 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 5 5 5 5 5 5 5 5 5 5 5 5 5 0 0 0 0 0 1 0 0 0 0 0\n\nTest Input 2:\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 4 4 0 1 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 4 0 4 0 1 0 0 5 5 5 5 5 5 5 5 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 4 4 4 0 1 0 0 5 5 5 5 5 0 0 5 0 0 5 5 5 5 0 5 5 0 0 0 0 0\n0 0 0 0 0 1 0 0 5 5 5 5 5 5 5 5 0 0 5 5 5 5 5 5 5 5 0 0 0 0\n0 7 7 7 0 1 0 0 0 0 5 5 5 5 0 0 0 0 5 0 5 5 5 5 5 5 5 0 0 0\n0 7 0 7 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5 5 5 0 0 0\n0 7 7 7 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0\n0 7 0 7 0 1 0 0 0 0 0 0 5 5 5 5 0 0 5 5 5 5 5 5 0 0 0 0 0 0\n0 7 7 7 0 1 0 0 0 0 0 0 5 0 0 5 0 0 0 0 0 5 5 0 0 0 5 5 5 5\n0 0 0 0 0 1 0 0 0 0 0 5 5 5 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 5\n0 2 2 2 0 1 0 0 0 0 5 5 5 0 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0\n0 2 0 2 0 1 0 0 0 0 5 5 5 5 5 5 5 0 0 0 0 0 0 0 0 5 5 5 5 0\n0 2 2 2 0 1 0 0 0 0 0 0 5 5 5 5 0 0 0 0 0 0 0 0 0 0 0 5 0 0\n0 2 0 2 0 1 0 0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 2 2 2 0 1 0 0 0 0 0 0 0 0 0 0 5 5 0 0 0 0 5 5 5 5 0 0 0 0\n0 2 0 2 0 1 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 5 5 5 0 5 5 5 0 0\n0 2 2 2 0 1 0 0 0 0 0 0 0 0 0 0 5 5 0 0 5 5 5 5 0 5 5 5 0 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 5 0 5 5 5 5 5 5 5 0 0\n0 1 1 1 0 1 0 0 0 5 5 5 5 5 0 0 0 0 0 5 0 0 5 5 5 5 5 0 0 0\n0 1 0 1 0 1 0 5 5 0 0 5 0 5 0 0 0 0 0 5 5 0 0 5 5 5 5 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 5 5 5 5 5 0 0 0\n0 1 0 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 0 0 5 5 5 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 0 0 5 5 0 0 0 0\n0 1 0 1 0 1 0 5 5 5 5 5 5 5 5 0 0 0 0 0 5 5 5 5 5 0 0 0 0 0\n0 1 1 1 0 1 0 5 5 5 5 0 0 5 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n0 1 0 1 0 1 0 5 5 0 5 5 5 5 5 0 0 0 5 0 0 0 0 0 0 0 5 5 5 0\n0 1 1 1 0 1 0 0 5 5 5 5 5 5 0 0 0 0 5 5 5 0 0 0 0 0 5 5 5 0\n0 0 0 0 0 1 0 0 0 0 0 5 5 0 0 0 0 5 5 5 5 5 0 0 0 0 5 5 5 0\n0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 5 5 5 0 0 0 0 0 0 0 0 0\n\nFor each test input, give your answer in a numbered tag: for test 1, for test 2, etc.\nUse space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 0, + 8, + 0 + ], + [ + 0, + 8, + 0, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 8, + 0, + 0, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 0, + 8, + 0 + ], + [ + 0, + 8, + 8, + 8, + 8, + 0, + 0, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, 
+ 0, + 0, + 0, + 0, + 0, + 1, + 0, + 8, + 8, + 8, + 0 + ], + [ + 0, + 0, + 8, + 8, + 8, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 6, + 6, + 0, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 6, + 6, + 0, + 0, + 6, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 8, + 8, + 8, + 8, + 0, + 0, + 6, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 0, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 0, + 0, + 0, + 8, + 0, + 8, + 0, + 0, + 6, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 6, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 6, + 6, + 0, + 0, + 6, + 0, + 6, + 6, + 6, + 6, + 0, + 1, + 0, + 6, + 0, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 8, + 8, + 8, + 8, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 0, + 0, + 6, + 6, + 0, + 1, + 0, + 6, + 6, + 6, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 8, + 0, + 0, + 0, + 6, + 6, + 6, + 6, + 0, + 6, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 8, + 8, + 0, + 0, + 0, + 0, + 0, + 0, + 6, + 6, + 6, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, 
+ 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 4, + 4, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 4, + 0, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 0, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 1, + 0, + 4, + 4, + 4, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 0, + 0, + 0, + 4, + 4, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0 + ] + ], + [ + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, 
+ 0, + 0, + 0 + ], + [ + 0, + 4, + 4, + 4, + 0, + 1, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 4, + 0, + 4, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 4, + 4, + 4, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 4, + 0, + 0, + 7, + 7, + 7, + 7, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 4, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 4, + 4, + 4, + 4, + 0, + 0, + 0, + 0, + 7, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0 + ], + [ + 0, + 7, + 7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 0, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 7, + 7, + 7, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 0, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, 
+ 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 2, + 0, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 0, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 2, + 2, + 2, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 0, + 0, + 1, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 2, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 0, + 0, + 2, + 2, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 2, + 2, + 2, + 2, + 2, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 1, + 1, + 1, + 1, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 0, + 1, + 0, 
+ 1, + 0, + 1, + 1, + 0, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 1, + 1, + 1, + 0, + 1, + 0, + 0, + 1, + 1, + 1, + 1, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 1, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file diff --git a/problems/arc2_faa9f03d.json b/problems/arc2_faa9f03d.json new file mode 100644 index 0000000..190fcfd --- /dev/null +++ b/problems/arc2_faa9f03d.json @@ -0,0 +1,178 @@ +{ + "problem_id": "arc2_faa9f03d", + "problem_text": "ARC Puzzle: Predict the test output grid.\n\nTraining Example 1:\nInput:\n0 0 0 0 0 0 0 0 0 3 0 0\n1 1 1 1 0 0 0 0 0 3 0 0\n0 0 0 1 0 0 0 0 0 3 0 0\n2 3 3 3 2 0 0 0 0 3 0 0\n0 0 0 1 3 0 0 0 0 3 0 0\n0 0 0 1 3 1 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 2 3 3 3 0 2 0 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 1 1 0 1 1 0\n0 0 0 0 0 0 0 0 0 0 1 1\n\nOutput:\n0 0 0 0 0 0 0 0 0 3 0 0\n1 1 1 1 0 0 0 0 0 3 0 0\n0 0 0 1 0 0 0 0 0 3 0 0\n3 3 3 1 3 0 0 0 0 3 0 0\n0 0 0 1 3 0 0 0 0 3 0 0\n0 0 0 1 1 1 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 0 1 0 0 3 0 0\n0 0 0 0 3 3 1 3 3 3 0 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 0 0 0 0 0 1 1 1 1 1 0\n0 0 0 0 0 0 0 0 0 0 1 1\n\nTraining Example 2:\nInput:\n0 0 0 0 0 0 0 0 0 0 7 0\n7 7 7 7 0 0 0 0 0 0 7 0\n3 3 3 3 3 0 3 3 3 4 7 0\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 0 0 0 0 0 0 0 7 0\n0 0 0 7 7 7 7 0 3 0 0 0\n0 0 0 0 0 0 7 0 3 0 7 0\n0 0 7 7 7 7 7 0 3 0 7 0\n0 0 7 0 0 0 0 0 3 0 7 0\n3 3 0 3 3 3 3 3 3 0 7 0\n0 0 7 7 7 7 7 7 7 7 7 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 0 0 0 0 0 0 0 0 0 7 0\n7 7 7 7 0 0 0 0 0 0 7 0\n0 
0 0 7 0 0 0 0 3 3 3 3\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 7 0 0 0 0 3 0 7 0\n0 0 0 7 7 7 7 0 3 0 7 0\n0 0 0 0 0 0 7 0 3 0 7 0\n0 0 7 7 7 7 7 0 3 0 7 0\n0 0 7 0 0 0 0 0 3 0 7 0\n3 3 3 3 3 3 3 3 3 0 7 0\n0 0 7 7 7 7 7 7 7 7 7 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nTraining Example 3:\nInput:\n0 0 7 0 3 0 6 0 0 2 0 0\n0 0 7 0 0 0 0 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n3 3 7 3 2 0 6 0 0 1 0 0\n0 0 7 0 0 0 6 0 6 1 6 6\n0 0 7 0 0 0 0 0 0 1 0 0\n7 0 7 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 1 0 0\n0 0 0 0 2 1 1 1 1 2 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n\nOutput:\n0 0 7 0 3 0 6 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n0 0 7 0 3 0 6 0 0 1 0 0\n3 3 3 3 3 0 6 0 0 1 0 0\n0 0 7 0 0 0 6 6 6 6 6 6\n0 0 7 0 0 0 0 0 0 1 0 0\n7 7 7 0 0 0 0 0 0 1 0 0\n0 0 0 0 0 0 0 0 0 1 0 0\n0 0 0 0 1 1 1 1 1 1 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n0 0 0 0 1 0 0 0 0 0 0 0\n\nTraining Example 4:\nInput:\n0 1 0 0 0 0 1 0 0 0 6 0\n0 1 0 0 0 0 1 0 0 0 6 0\n6 1 6 6 6 6 0 6 0 6 6 0\n0 1 0 0 0 0 1 0 0 0 4 0\n0 0 0 0 0 0 1 0 0 0 0 0\n0 1 1 1 0 1 1 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nOutput:\n0 1 0 0 0 0 1 0 0 0 0 0\n0 1 0 0 0 0 1 0 0 0 0 0\n6 1 6 6 6 6 1 6 6 6 6 0\n0 1 0 0 0 0 1 0 0 0 6 0\n0 1 0 0 0 0 1 0 0 0 6 0\n0 1 1 1 1 1 1 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n0 0 0 0 0 0 0 0 0 0 6 0\n\nTest Input:\n0 0 0 0 7 0 0 0 0 0 7 0\n0 0 0 0 7 0 0 0 0 0 7 0\n0 0 0 0 7 0 0 0 0 0 7 0\n4 2 7 7 2 0 0 2 7 7 2 0\n0 7 0 0 0 0 0 7 0 0 4 0\n0 7 0 0 0 0 0 7 0 0 0 0\n0 7 0 0 0 0 0 7 0 0 0 0\n6 6 6 6 6 6 6 0 6 6 6 6\n0 7 0 0 0 0 0 7 0 0 0 0\n0 2 7 7 7 7 7 2 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n0 0 0 0 0 0 0 0 0 0 0 0\n\nGive your answer in ... 
tags, space-separated values, one row per line.", + "ground_truth": [ + [ + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0 + ], + [ + 7, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 7, + 7, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 6, + 7, + 6, + 6, + 6, + 6, + 6, + 7, + 6, + 6, + 7, + 6 + ], + [ + 0, + 7, + 0, + 0, + 0, + 0, + 0, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 7, + 7, + 7, + 7, + 7, + 7, + 7, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ], + [ + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 0, + 7, + 0 + ] + ] + ], + "topic": "arc", + "source": "ARC1-Eval" +} \ No newline at end of file