Skip to content

Commit a3057ff

Browse files
committed
update evaluate
1 parent 0d35236 commit a3057ff

16 files changed

+67134
-231
lines changed

.github/workflows/evaluations.yaml

+3-3
Original file line number | Diff line number | Diff line change
@@ -63,16 +63,16 @@ jobs:
6363
inlineScript: |
6464
az account set --subscription ${{env.AZURE_SUBSCRIPTION_ID}}
6565
66-
- name: evaluate orchestrator
66+
- name: evaluate
6767
working-directory: ./src/api
6868
run: |
69-
python -m evaluate.evaluate
69+
python -m evaluators.evaluate
7070
7171
- name: Upload eval results as build artifact
7272
uses: actions/upload-artifact@v4
7373
with:
7474
name: eval_result
75-
path: ./src/api/evaluate/eval_results.jsonl
75+
path: ./src/api/evaluators/eval_results.jsonl
7676

7777
- name: GitHub Summary Step
7878
if: ${{ success() }}

.gitignore

+13-7
Original file line number | Diff line number | Diff line change
@@ -11,14 +11,20 @@ deployment/push_and_deploy_pf.py
1111
endpoint.json
1212
principal.txt
1313
.azure
14-
evaluations/process_log/
15-
evaluations/flow.flex.yaml
16-
evaluations/eval_result.**
17-
evaluations/studio_url.txt
14+
evaluators/process_log/
15+
evaluators/flow.flex.yaml
16+
evaluators/eval_result.**
17+
evaluators/studio_url.txt
1818
src/contoso_chat/.runs/*
1919
src/api/contoso_chat/.runs/*
2020
src/api/.runs/*
2121
.runs/*
22-
evaluations/.runs/*
23-
evaluations/result_evaluated.jsonl
24-
evaluations/result.jsonl
22+
evaluators/.runs/*
23+
evaluators/result_evaluated.jsonl
24+
evaluators/result.jsonl
25+
src/api/evaluators/.runs/*
26+
src/api/evaluators/result_evaluated.jsonl
27+
src/api/evaluators/result.jsonl
28+
src/api/evaluators/eval_results.jsonl
29+
src/api/evaluators/eval_results.md
30+
src/api/evaluators/.runs/*

evaluations/.promptflow/relevance/flow.tools.json

-25
This file was deleted.

evaluations/evaluate-chat-flow.ipynb

-143
This file was deleted.

evaluations/evaluate.py

-53
This file was deleted.
File renamed without changes.
File renamed without changes.

0 commit comments

Comments
 (0)