{"version":"1.0","workflow_uuid":"7fd5858d-76a8-4679-80d1-ee1191ad2977","workflow_title":"SWE-bench — Benchmark for Coding Agents","install_contract":{"version":"1.0","installReady":false,"title":"SWE-bench — Benchmark for Coding Agents","summary":"Evaluate coding agents on real GitHub issues with SWE-bench, including a harness to run and score patch predictions. Compare models and tool stacks.","assetType":"Knowledge","pageUrl":"","sourceUrl":"https://github.com/SWE-bench/SWE-bench","intendedFor":[],"firstActions":[],"agentFirstSteps":[],"targetPaths":[],"verification":[],"startingPoints":[],"example":"","successOutcome":"","boundaries":[],"askUserIf":["the current workspace stack cannot be matched to a safe upstream template","the target path is not the project root, or an existing file should be merged instead of overwritten"]}}