Find Commit Date

L3
ModelContextProtocol · GitHub · Build Your Own X

Find when Voxel Engine entries were first created by Daniel Stefanovic and document the date.

Created by Xiangyan Liu
2025-08-15
Repository Analysis

Model Ranking

Click on the dots to view the trajectory of each task run
Model
Run Results
Pass@4
Pass^4
Avg Time
Avg Turns
Input Tokens
Output Tokens
Total Tokens
Claude
claude-4-1-opus
0
/1
--
101.4s
5.0
258,338
680
259,018
Claude
claude-4-sonnet
0
/4
60.4s
3.8
89,580
564
90,144
DeepSeek
deepseek-chat
0
/4
66.1s
3.8
125,972
291
126,263
Gemini
gemini-2-5-pro
0
/4
80.0s
3.0
25,923
7,236
33,158
OpenAI
gpt-5
0
/4
138.2s
3.3
360,446
3,944
364,389
Grok
grok-4
0
/4
30.4s
-
-
-
-
MoonshotAI
k2
0
/4
101.5s
3.0
52,754
314
53,067
OpenAI
o3
0
/4
90.3s
5.0
508,663
2,132
510,795
Qwen
qwen-3-coder
0
/4
119.1s
8.0
680,268
732
681,000

Task State


Instruction



Verify

*.py
Python
import sys
import os
import requests
from typing import Dict, Optional, Tuple
import base64
from dotenv import load_dotenv


def _get_github_api(
    endpoint: str,
    headers: Dict[str, str],
    org: str,
    repo: str = "build-your-own-x",
    timeout: float = 30.0,
) -> Tuple[bool, Optional[Dict]]:
    """Make a GET request to the GitHub API and return ``(success, response)``.

    Args:
        endpoint: Path appended to ``/repos/{org}/{repo}/``; may carry a
            query string.
        headers: HTTP headers sent with the request.
        org: Owner segment of the repository URL.
        repo: Repository name segment of the URL.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout a stalled connection would block the caller indefinitely.

    Returns:
        ``(True, parsed_json)`` when the server answers 200. ``(False, None)``
        otherwise: a 404 is reported silently, any other status code and any
        request or JSON-parsing failure is logged to stderr.
    """
    url = f"https://api.github.com/repos/{org}/{repo}/{endpoint}"
    try:
        response = requests.get(url, headers=headers, timeout=timeout)
        if response.status_code == 200:
            return True, response.json()
    except (requests.RequestException, ValueError) as e:
        # RequestException covers connection errors and timeouts; ValueError
        # covers a 200 response whose body is not valid JSON.
        print(f"Exception for {endpoint}: {e}", file=sys.stderr)
        return False, None

    # A 404 is an expected "does not exist" answer, so it is not logged.
    if response.status_code != 404:
        print(f"API error for {endpoint}: {response.status_code}", file=sys.stderr)
    return False, None


def _get_file_content(
    file_path: str,
    headers: Dict[str, str],
    org: str,
    repo: str = "build-your-own-x",
    ref: str = "master",
) -> Optional[str]:
    """Fetch a repository file and return its text decoded as UTF-8.

    The file is requested through the ``contents/`` endpoint at the given
    ``ref``; the ``content`` field of the response is base64-decoded.

    Returns:
        The decoded text, or None when the request fails, the response is
        empty, or decoding raises (the decode error is logged to stderr).
    """
    endpoint = f"contents/{file_path}?ref={ref}"
    ok, payload = _get_github_api(endpoint, headers, org, repo)
    if not (ok and payload):
        return None

    try:
        encoded = payload.get("content", "")
        raw_bytes = base64.b64decode(encoded)
        text = raw_bytes.decode("utf-8")
    except Exception as err:
        print(f"Content decode error for {file_path}: {err}", file=sys.stderr)
        return None
    return text


def verify_task() -> bool:
    """Verify the "find commit date" task for the Voxel Engine entries.

    Loads environment variables from ``.mcp_env``, fetches ``ANSWER.md`` and
    checks that it holds exactly the expected ``YYYY-MM-DD`` date, then
    confirms that ``README.md`` mentions the Voxel Engine section.

    Returns:
        True when every check passes; False as soon as one of them fails.
    """
    import re

    # Token and organisation are read from the environment after loading
    # the .mcp_env file.
    load_dotenv(".mcp_env")
    token = os.environ.get("MCP_GITHUB_TOKEN")
    org = os.environ.get("GITHUB_EVAL_ORG")

    required_settings = (
        (token, "Error: MCP_GITHUB_TOKEN environment variable not set"),
        (org, "Error: GITHUB_EVAL_ORG environment variable not set"),
    )
    for value, complaint in required_settings:
        if not value:
            print(complaint, file=sys.stderr)
            return False

    request_headers = {
        "Authorization": f"Bearer {token}",
        "Accept": "application/vnd.github.v3+json",
    }

    print("Verifying Voxel Engine commit date task...")

    # Step 1: the answer file has to be retrievable and non-empty.
    print("1. Checking if ANSWER.md exists...")
    answer = _get_file_content("ANSWER.md", request_headers, org)
    if not answer:
        print("Error: ANSWER.md not found in repository", file=sys.stderr)
        return False
    print("✓ ANSWER.md found")

    # Step 2: after trimming whitespace the file must be a bare YYYY-MM-DD date.
    print("2. Checking content format...")
    answer = answer.strip()
    if re.match(r'^\d{4}-\d{2}-\d{2}$', answer) is None:
        print(f"Error: Invalid date format. Expected YYYY-MM-DD, got: {answer}", file=sys.stderr)
        return False
    print("✓ Date format is correct")

    # Step 3: compare against the date on which Daniel Stefanovic added the
    # Voxel Engine entries.
    print("3. Verifying the date...")
    expected_date = "2018-07-07"
    if answer != expected_date:
        print(f"Error: Incorrect date. Expected {expected_date}, got: {answer}", file=sys.stderr)
        return False
    print(f"✓ Date is correct: {answer}")

    # Step 4: the README must still contain the Voxel Engine section.
    print("4. Checking if README.md contains Voxel Engine section...")
    readme = _get_file_content("README.md", request_headers, org)
    if not readme:
        print("Error: README.md not found in repository", file=sys.stderr)
        return False
    if "Voxel Engine" not in readme:
        print("Error: Voxel Engine section not found in README.md", file=sys.stderr)
        return False

    # Individual entries that are missing only trigger a warning; they do not
    # fail the verification.
    expected_entries = (
        "Let's Make a Voxel Engine",
        "Java Voxel Engine Tutorial",
    )
    missing_entries = [title for title in expected_entries if title not in readme]
    for title in missing_entries:
        print(f"Warning: Voxel Engine entry '{title}' not found in README.md", file=sys.stderr)

    print("✓ Voxel Engine section found in README.md")

    summary_lines = (
        "\n✅ All verification checks passed!",
        "Task completed successfully:",
        f"  - ANSWER.md created with date: {answer}",
        "  - Date format is correct (YYYY-MM-DD)",
        "  - Date matches expected creation date for Voxel Engine entries by Daniel Stefanovic",
        "  - Voxel Engine section exists in README.md",
    )
    for line in summary_lines:
        print(line)

    return True


if __name__ == "__main__":
    # Exit status 0 signals a passing verification, 1 a failed one.
    exit_code = 0 if verify_task() else 1
    sys.exit(exit_code)