Skip to content

Commit 94e4eeb

Browse files
haoranpb and Copilot authored
update copilot and refresh models (#584)
Co-authored-by: Copilot <198982749+Copilot@users.noreply.github.com>
1 parent 504e2ab commit 94e4eeb

5 files changed

Lines changed: 5 additions & 12 deletions

File tree

.github/workflows/copilot-evaluation.yml

Lines changed: 2 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -18,14 +18,11 @@ on:
1818
- "claude-opus-4.5"
1919
- "claude-opus-4.6"
2020
- "claude-opus-4.6-fast"
21+
- "gpt-5.4"
2122
- "gpt-5.3-codex"
2223
- "gpt-5.2-codex"
2324
- "gpt-5.2"
24-
- "gpt-5.1-codex-mini"
25-
- "gpt-5.1-codex"
26-
- "gpt-5.1-codex-max"
2725
- "gpt-4.1"
28-
- "gemini-3-pro-preview"
2926
category:
3027
description: "Evaluation category to run"
3128
required: false
@@ -115,7 +112,7 @@ jobs:
115112
run: dotnet tool install Microsoft.Dynamics.BusinessCentral.Development.Tools --version 17.0.30.49729-beta --global
116113

117114
- name: Install GitHub Copilot CLI
118-
run: npm install -g @github/copilot@0.0.411
115+
run: npm install -g @github/copilot@1.0.2
119116

120117
- name: Select PAT based on job index
121118
id: select-pat

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
44

55
[project]
66
name = "bcbench"
7-
version = "0.3.0"
7+
version = "0.3.1"
88
description = "Benchmarking tool for Business Central (AL) ecosystem, inspired by SWE-Bench"
99
readme = "README.md"
1010
requires-python = ">=3.13"

src/bcbench/agent/copilot/agent.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -58,7 +58,6 @@ def run_copilot_agent(entry: DatasetEntry, model: str, category: EvaluationCateg
5858
"--disable-builtin-mcps",
5959
f"--model={model}",
6060
"--log-level=debug",
61-
"--disable-parallel-tools-execution",
6261
f"--log-dir={output_dir.resolve()}",
6362
f"-p={prompt.replace('\r', '').replace('\n', ' ')}",
6463
]

src/bcbench/cli_options.py

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -35,14 +35,11 @@
3535
"claude-opus-4.5",
3636
"claude-opus-4.6",
3737
"claude-opus-4.6-fast",
38+
"gpt-5.4",
3839
"gpt-5.3-codex",
3940
"gpt-5.2-codex",
4041
"gpt-5.2",
41-
"gpt-5.1-codex-mini",
42-
"gpt-5.1-codex",
43-
"gpt-5.1-codex-max",
4442
"gpt-4.1",
45-
"gemini-3-pro-preview",
4643
],
4744
typer.Option(help="Copilot model to use"),
4845
]

uv.lock

Lines changed: 1 addition & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments (0)