mirrored 18 minutes ago
0
MillanK patch: minor bug fixes for evaluator and task configurations, documentation update (#121) * fix: /cursor_position api return format fix * chore: update README.md to remove deprecated command * fix: add base score for evaluators and minor bug fixes * fix: add base score for setup configurations --------- Co-authored-by: Jiaqi Deng <jiaqideng@Jiaqis-MacBook-Pro.local> 983283a
{
    "id": "c2751594-0cd5-4088-be1b-b5f2f9ec97c4",
    "snapshot": "thunderbird",
    "instruction": "Help me export the first image from the doc file attached in the most recent email in the Notes folder, and set this image as the new desktop background.",
    "source": "authors",
    "config": [
        {
            "type": "download",
            "parameters": {
                "files": [
                    {
                        "url": "https://drive.usercontent.google.com/download?id=1JcDjBGBP5ly90pdVLs3ySoe6qX9Ht_d6&export=download&authuser=0&confirm=t",
                        "path": "/home/user/thunderbird-profile.tar.gz"
                    }
                ]
            }
        },
        {
            "type": "execute",
            "parameters": {
                "command": [
                    "tar",
                    "--recursive-unlink",
                    "-xz",
                    "-f",
                    "/home/user/thunderbird-profile.tar.gz",
                    "-C",
                    "/home/user/"
                ]
            }
        },
        {
            "type": "launch",
            "parameters": {
                "command": [
                    "/usr/bin/thunderbird"
                ]
            }
        }
    ],
    "trajectory": "trajectories/",
    "related_apps": [
        "thunderbird",
        "os"
    ],
    "evaluator": {
        "func": "compare_images",
        "result": {
            "type": "vm_wallpaper",
            "dest": "background.png"
        },
        "expected": {
            "type": "cloud_file",
            "path": "https://drive.usercontent.google.com/download?id=1iIdjmXD6fRSYtpqxujTGzx8agvIgXsqz&export=download&authuser=0&confirm=t",
            "dest": "gold_background.png"
        },
        "options": {
            "reference_base_result": 0.54
        }
    }
}