Skip to content

Commit 9fe5044

Browse files
author
Jiawen Sun
committed
Merge branch 'main' of https://github.com/microsoft/BC-Bench into master_thesis
2 parents bf728d4 + ee09540 commit 9fe5044

31 files changed

Lines changed: 1096 additions & 287 deletions

.github/workflows/CI.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ jobs:
1919

2020
steps:
2121
- name: Checkout repository
22-
uses: actions/checkout@v4
22+
uses: actions/checkout@v5
2323

2424
- name: Setup Python with UV
2525
uses: ./.github/actions/setup-python-uv
@@ -63,7 +63,7 @@ jobs:
6363
name: Test Run for ${{ matrix.entry }}
6464
steps:
6565
- name: Checkout repository
66-
uses: actions/checkout@v4
66+
uses: actions/checkout@v5
6767

6868
- name: Setup Python with UV
6969
uses: ./.github/actions/setup-python-uv
@@ -72,7 +72,7 @@ jobs:
7272
run: uv run bcbench evaluate mock "${{ matrix.entry }}" --category ${{ needs.select-category.outputs.category }} --output-dir evaluation_results --run-id ${{ github.run_id }}
7373

7474
- name: Upload mock evaluation results
75-
uses: actions/upload-artifact@v4
75+
uses: actions/upload-artifact@v6
7676
with:
7777
name: ${{ matrix.entry }}
7878
path: ${{ env.EVALUATION_RESULTS_DIR }}/

.github/workflows/claude-evaluation.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -77,7 +77,7 @@ jobs:
7777
entry: ${{ fromJson(needs.get-entries.outputs.entries) }}
7878
steps:
7979
- name: Checkout repository
80-
uses: actions/checkout@v4
80+
uses: actions/checkout@v5
8181

8282
- name: Setup BC container
8383
id: setup-env
@@ -99,14 +99,14 @@ jobs:
9999
- name: Install AL Tool
100100
if: ${{ inputs.al-mcp }}
101101
run: |
102-
dotnet tool install -g Microsoft.Dynamics.BusinessCentral.Development.Tools --version 18.0.33.30146-beta
102+
dotnet tool install -g Microsoft.Dynamics.BusinessCentral.Development.Tools --version 17.0.33.55542
103103
echo "$HOME\.dotnet\tools" >> $env:GITHUB_PATH
104104
105105
- name: Install Claude Code
106106
run: npm install -g @anthropic-ai/claude-code@2.1.69
107107

108108
- name: Run Claude Code for entry ${{ matrix.entry }}
109-
timeout-minutes: 90
109+
timeout-minutes: 120
110110
env:
111111
ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
112112
run: |
@@ -118,7 +118,7 @@ jobs:
118118
${{ inputs.al-mcp && '--al-mcp' || '' }}
119119
120120
- name: Upload evaluation results
121-
uses: actions/upload-artifact@v4
121+
uses: actions/upload-artifact@v6
122122
if: always()
123123
with:
124124
name: evaluation-results-${{ github.run_id }}-${{ matrix.entry }}

.github/workflows/copilot-evaluation.yml

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -85,7 +85,7 @@ jobs:
8585
entry: ${{ fromJson(needs.get-entries.outputs.entries) }}
8686
steps:
8787
- name: Checkout repository
88-
uses: actions/checkout@v4
88+
uses: actions/checkout@v5
8989

9090
- name: Setup BC container
9191
id: setup-env
@@ -107,7 +107,7 @@ jobs:
107107
- name: Install AL Tool
108108
if: ${{ inputs.al-mcp }}
109109
run: |
110-
dotnet tool install -g Microsoft.Dynamics.BusinessCentral.Development.Tools --version 18.0.33.30146-beta
110+
dotnet tool install -g Microsoft.Dynamics.BusinessCentral.Development.Tools --version 17.0.33.55542
111111
echo "$HOME\.dotnet\tools" >> $env:GITHUB_PATH
112112
113113
- name: Install GitHub Copilot CLI
@@ -120,9 +120,9 @@ jobs:
120120
echo "pat_index=$patIndex" >> $env:GITHUB_OUTPUT
121121
122122
- name: Run GitHub Copilot CLI for entry ${{ matrix.entry }}
123-
timeout-minutes: 90
123+
timeout-minutes: 120
124124
env:
125-
GH_TOKEN: ${{ steps.select-pat.outputs.pat_index == '0' && secrets.COPILOT_PAT || (steps.select-pat.outputs.pat_index == '1' && secrets.COPILOT_PAT2 || secrets.COPILOT_PAT3) }}
125+
COPILOT_GITHUB_TOKEN: ${{ steps.select-pat.outputs.pat_index == '0' && secrets.COPILOT_PAT || (steps.select-pat.outputs.pat_index == '1' && secrets.COPILOT_PAT2 || secrets.COPILOT_PAT3) }}
126126
run: |
127127
uv run bcbench evaluate copilot "${{ matrix.entry }}" `
128128
--model "${{ inputs.model }}" `
@@ -132,7 +132,7 @@ jobs:
132132
${{ inputs.al-mcp && '--al-mcp' || '' }}
133133
134134
- name: Upload evaluation results
135-
uses: actions/upload-artifact@v4
135+
uses: actions/upload-artifact@v6
136136
if: always()
137137
with:
138138
name: evaluation-results-${{ github.run_id }}-${{ matrix.entry }}

.github/workflows/copilot-setup-steps.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ jobs:
1818

1919
steps:
2020
- name: Checkout code
21-
uses: actions/checkout@v4
21+
uses: actions/checkout@v5
2222

2323
- name: Install uv
2424
uses: astral-sh/setup-uv@v7

.github/workflows/dataset-validation.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ jobs:
3838
entry: ${{ fromJson(needs.get-entries.outputs.entries) }}
3939
steps:
4040
- name: Checkout repository
41-
uses: actions/checkout@v4
41+
uses: actions/checkout@v5
4242

4343
- name: Setup BC container
4444
id: setup-env

.github/workflows/get-entries.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ jobs:
3232
entries: ${{ steps.get-entries.outputs.entries }}
3333
steps:
3434
- name: Checkout repository
35-
uses: actions/checkout@v4
35+
uses: actions/checkout@v5
3636
with:
3737
fetch-depth: ${{ inputs.modified-only && '0' || '1' }}
3838

.github/workflows/mini-evaluation.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -57,7 +57,7 @@ jobs:
5757
entry: ${{ fromJson(needs.get-entries.outputs.entries) }}
5858
steps:
5959
- name: Checkout repository
60-
uses: actions/checkout@v4
60+
uses: actions/checkout@v5
6161

6262
- name: Setup BC container
6363
id: setup-env
@@ -93,7 +93,7 @@ jobs:
9393
--output-dir "${{ env.EVALUATION_RESULTS_DIR }}"
9494
9595
- name: Upload evaluation results
96-
uses: actions/upload-artifact@v4
96+
uses: actions/upload-artifact@v6
9797
if: always()
9898
with:
9999
name: evaluation-results-${{ github.run_id }}-${{ matrix.entry }}

.github/workflows/summarize-results.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ jobs:
3939
runs-on: ubuntu-latest
4040
steps:
4141
- name: Checkout repository
42-
uses: actions/checkout@v4
42+
uses: actions/checkout@v5
4343

4444
- name: Setup Python with UV
4545
uses: ./.github/actions/setup-python-uv
@@ -54,7 +54,7 @@ jobs:
5454
run: uv run bcbench result summarize --result-dir "${{ inputs.results-dir }}" --bceval-output "${{ env.BCEVAL_RESULT_FILE }}" --summary-output "${{ env.SUMMARY_OUTPUT_FILE }}"
5555

5656
- name: Upload evaluation summary to artifacts
57-
uses: actions/upload-artifact@v4
57+
uses: actions/upload-artifact@v6
5858
with:
5959
name: evaluation-summary
6060
path: ${{ inputs.results-dir }}/${{ github.run_id }}/${{ env.SUMMARY_OUTPUT_FILE }}
-2.57 KB
Loading
-4.97 KB
Loading

0 commit comments

Comments
 (0)