{
    "version": "b9010",
    "description": "Inference of LLaMA model in pure C/C++ (SYCL version)",
    "homepage": "https://github.com/ggml-org/llama.cpp",
    "license": "MIT",
    "architecture": {
        "64bit": {
            "url": "https://github.com/ggml-org/llama.cpp/releases/download/b9010/llama-b9010-bin-win-sycl-x64.zip",
            "hash": "a979b0cb4f2111510b434a9b16a5a2edaab5425ed1bb3881085909bb7945203d"
        }
    },
    "bin": [
        "llama-batched-bench.exe",
        "llama-bench.exe",
        "llama-cli.exe",
        "llama-completion.exe",
        "llama-fit-params.exe",
        "llama-gemma3-cli.exe",
        "llama-gguf-split.exe",
        "llama-imatrix.exe",
        "llama-llava-cli.exe",
        "llama-minicpmv-cli.exe",
        "llama-mtmd-cli.exe",
        "llama-perplexity.exe",
        "llama-quantize.exe",
        "llama-qwen2vl-cli.exe",
        "llama-server.exe",
        "llama-tokenize.exe",
        "llama-tts.exe"
    ],
    "persist": "models",
    "checkver": {
        "github": "https://github.com/ggml-org/llama.cpp",
        "regex": "/releases/tag/(b[\\d]+)"
    },
    "autoupdate": {
        "architecture": {
            "64bit": {
                "url": "https://github.com/ggml-org/llama.cpp/releases/download/$version/llama-$version-bin-win-sycl-x64.zip"
            }
        }
    }
}