Files

1000 lines
34 KiB
JSON

{
"benchmark": "HumanEval",
"version": "1.0",
"timestamp": "2026-01-05T00:49:17.745476",
"model": "opus",
"timeout_per_problem": 300,
"total_problems": 164,
"status": "COMPLETED",
"problems": [
{
"task_id": "HumanEval/0",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/0.py"
},
{
"task_id": "HumanEval/1",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/1.py"
},
{
"task_id": "HumanEval/2",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/2.py"
},
{
"task_id": "HumanEval/3",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/3.py"
},
{
"task_id": "HumanEval/4",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/4.py"
},
{
"task_id": "HumanEval/5",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/5.py"
},
{
"task_id": "HumanEval/6",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/6.py"
},
{
"task_id": "HumanEval/7",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/7.py"
},
{
"task_id": "HumanEval/8",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/8.py"
},
{
"task_id": "HumanEval/9",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/9.py"
},
{
"task_id": "HumanEval/10",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/10.py"
},
{
"task_id": "HumanEval/11",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/11.py"
},
{
"task_id": "HumanEval/12",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/12.py"
},
{
"task_id": "HumanEval/13",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/13.py"
},
{
"task_id": "HumanEval/14",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/14.py"
},
{
"task_id": "HumanEval/15",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/15.py"
},
{
"task_id": "HumanEval/16",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/16.py"
},
{
"task_id": "HumanEval/17",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/17.py"
},
{
"task_id": "HumanEval/18",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/18.py"
},
{
"task_id": "HumanEval/19",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/19.py"
},
{
"task_id": "HumanEval/20",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/20.py"
},
{
"task_id": "HumanEval/21",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/21.py"
},
{
"task_id": "HumanEval/22",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/22.py"
},
{
"task_id": "HumanEval/23",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/23.py"
},
{
"task_id": "HumanEval/24",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/24.py"
},
{
"task_id": "HumanEval/25",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/25.py"
},
{
"task_id": "HumanEval/26",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/26.py"
},
{
"task_id": "HumanEval/27",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/27.py"
},
{
"task_id": "HumanEval/28",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/28.py"
},
{
"task_id": "HumanEval/29",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/29.py"
},
{
"task_id": "HumanEval/30",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/30.py"
},
{
"task_id": "HumanEval/31",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/31.py"
},
{
"task_id": "HumanEval/32",
"passed": false,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/32.py"
},
{
"task_id": "HumanEval/33",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/33.py"
},
{
"task_id": "HumanEval/34",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/34.py"
},
{
"task_id": "HumanEval/35",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/35.py"
},
{
"task_id": "HumanEval/36",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/36.py"
},
{
"task_id": "HumanEval/37",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/37.py"
},
{
"task_id": "HumanEval/38",
"passed": false,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/38.py"
},
{
"task_id": "HumanEval/39",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/39.py"
},
{
"task_id": "HumanEval/40",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/40.py"
},
{
"task_id": "HumanEval/41",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/41.py"
},
{
"task_id": "HumanEval/42",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/42.py"
},
{
"task_id": "HumanEval/43",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/43.py"
},
{
"task_id": "HumanEval/44",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/44.py"
},
{
"task_id": "HumanEval/45",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/45.py"
},
{
"task_id": "HumanEval/46",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/46.py"
},
{
"task_id": "HumanEval/47",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/47.py"
},
{
"task_id": "HumanEval/48",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/48.py"
},
{
"task_id": "HumanEval/49",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/49.py"
},
{
"task_id": "HumanEval/50",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/50.py"
},
{
"task_id": "HumanEval/51",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/51.py"
},
{
"task_id": "HumanEval/52",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/52.py"
},
{
"task_id": "HumanEval/53",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/53.py"
},
{
"task_id": "HumanEval/54",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/54.py"
},
{
"task_id": "HumanEval/55",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/55.py"
},
{
"task_id": "HumanEval/56",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/56.py"
},
{
"task_id": "HumanEval/57",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/57.py"
},
{
"task_id": "HumanEval/58",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/58.py"
},
{
"task_id": "HumanEval/59",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/59.py"
},
{
"task_id": "HumanEval/60",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/60.py"
},
{
"task_id": "HumanEval/61",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/61.py"
},
{
"task_id": "HumanEval/62",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/62.py"
},
{
"task_id": "HumanEval/63",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/63.py"
},
{
"task_id": "HumanEval/64",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/64.py"
},
{
"task_id": "HumanEval/65",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/65.py"
},
{
"task_id": "HumanEval/66",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/66.py"
},
{
"task_id": "HumanEval/67",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/67.py"
},
{
"task_id": "HumanEval/68",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/68.py"
},
{
"task_id": "HumanEval/69",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/69.py"
},
{
"task_id": "HumanEval/70",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/70.py"
},
{
"task_id": "HumanEval/71",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/71.py"
},
{
"task_id": "HumanEval/72",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/72.py"
},
{
"task_id": "HumanEval/73",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/73.py"
},
{
"task_id": "HumanEval/74",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/74.py"
},
{
"task_id": "HumanEval/75",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/75.py"
},
{
"task_id": "HumanEval/76",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/76.py"
},
{
"task_id": "HumanEval/77",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/77.py"
},
{
"task_id": "HumanEval/78",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/78.py"
},
{
"task_id": "HumanEval/79",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/79.py"
},
{
"task_id": "HumanEval/80",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/80.py"
},
{
"task_id": "HumanEval/81",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/81.py"
},
{
"task_id": "HumanEval/82",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/82.py"
},
{
"task_id": "HumanEval/83",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/83.py"
},
{
"task_id": "HumanEval/84",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/84.py"
},
{
"task_id": "HumanEval/85",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/85.py"
},
{
"task_id": "HumanEval/86",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/86.py"
},
{
"task_id": "HumanEval/87",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/87.py"
},
{
"task_id": "HumanEval/88",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/88.py"
},
{
"task_id": "HumanEval/89",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/89.py"
},
{
"task_id": "HumanEval/90",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/90.py"
},
{
"task_id": "HumanEval/91",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/91.py"
},
{
"task_id": "HumanEval/92",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/92.py"
},
{
"task_id": "HumanEval/93",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/93.py"
},
{
"task_id": "HumanEval/94",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/94.py"
},
{
"task_id": "HumanEval/95",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/95.py"
},
{
"task_id": "HumanEval/96",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/96.py"
},
{
"task_id": "HumanEval/97",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/97.py"
},
{
"task_id": "HumanEval/98",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/98.py"
},
{
"task_id": "HumanEval/99",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/99.py"
},
{
"task_id": "HumanEval/100",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/100.py"
},
{
"task_id": "HumanEval/101",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/101.py"
},
{
"task_id": "HumanEval/102",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/102.py"
},
{
"task_id": "HumanEval/103",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/103.py"
},
{
"task_id": "HumanEval/104",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/104.py"
},
{
"task_id": "HumanEval/105",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/105.py"
},
{
"task_id": "HumanEval/106",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/106.py"
},
{
"task_id": "HumanEval/107",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/107.py"
},
{
"task_id": "HumanEval/108",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/108.py"
},
{
"task_id": "HumanEval/109",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/109.py"
},
{
"task_id": "HumanEval/110",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/110.py"
},
{
"task_id": "HumanEval/111",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/111.py"
},
{
"task_id": "HumanEval/112",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/112.py"
},
{
"task_id": "HumanEval/113",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/113.py"
},
{
"task_id": "HumanEval/114",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/114.py"
},
{
"task_id": "HumanEval/115",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/115.py"
},
{
"task_id": "HumanEval/116",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/116.py"
},
{
"task_id": "HumanEval/117",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/117.py"
},
{
"task_id": "HumanEval/118",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/118.py"
},
{
"task_id": "HumanEval/119",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/119.py"
},
{
"task_id": "HumanEval/120",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/120.py"
},
{
"task_id": "HumanEval/121",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/121.py"
},
{
"task_id": "HumanEval/122",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/122.py"
},
{
"task_id": "HumanEval/123",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/123.py"
},
{
"task_id": "HumanEval/124",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/124.py"
},
{
"task_id": "HumanEval/125",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/125.py"
},
{
"task_id": "HumanEval/126",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/126.py"
},
{
"task_id": "HumanEval/127",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/127.py"
},
{
"task_id": "HumanEval/128",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/128.py"
},
{
"task_id": "HumanEval/129",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/129.py"
},
{
"task_id": "HumanEval/130",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/130.py"
},
{
"task_id": "HumanEval/131",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/131.py"
},
{
"task_id": "HumanEval/132",
"passed": false,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/132.py"
},
{
"task_id": "HumanEval/133",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/133.py"
},
{
"task_id": "HumanEval/134",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/134.py"
},
{
"task_id": "HumanEval/135",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/135.py"
},
{
"task_id": "HumanEval/136",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/136.py"
},
{
"task_id": "HumanEval/137",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/137.py"
},
{
"task_id": "HumanEval/138",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/138.py"
},
{
"task_id": "HumanEval/139",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/139.py"
},
{
"task_id": "HumanEval/140",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/140.py"
},
{
"task_id": "HumanEval/141",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/141.py"
},
{
"task_id": "HumanEval/142",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/142.py"
},
{
"task_id": "HumanEval/143",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/143.py"
},
{
"task_id": "HumanEval/144",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/144.py"
},
{
"task_id": "HumanEval/145",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/145.py"
},
{
"task_id": "HumanEval/146",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/146.py"
},
{
"task_id": "HumanEval/147",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/147.py"
},
{
"task_id": "HumanEval/148",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/148.py"
},
{
"task_id": "HumanEval/149",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/149.py"
},
{
"task_id": "HumanEval/150",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/150.py"
},
{
"task_id": "HumanEval/151",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/151.py"
},
{
"task_id": "HumanEval/152",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/152.py"
},
{
"task_id": "HumanEval/153",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/153.py"
},
{
"task_id": "HumanEval/154",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/154.py"
},
{
"task_id": "HumanEval/155",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/155.py"
},
{
"task_id": "HumanEval/156",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/156.py"
},
{
"task_id": "HumanEval/157",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/157.py"
},
{
"task_id": "HumanEval/158",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/158.py"
},
{
"task_id": "HumanEval/159",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/159.py"
},
{
"task_id": "HumanEval/160",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/160.py"
},
{
"task_id": "HumanEval/161",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/161.py"
},
{
"task_id": "HumanEval/162",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/162.py"
},
{
"task_id": "HumanEval/163",
"passed": true,
"error": null,
"solution_file": "/Users/lokesh/git/loki-mode/benchmarks/results/2026-01-05-00-49-17/humaneval-solutions/163.py"
}
],
"passed": 161,
"failed": 3,
"errors": 0,
"pass_rate": 98.17,
"elapsed_seconds": 1263.46
}