Skip to content

[Feature] add mtbench #55

[Feature] add mtbench

[Feature] add mtbench #55

Workflow file for this run

name: pr_run_test
on:
pull_request:
paths-ignore:
- 'README.md'
- 'README_zh-CN.md'
- 'docs/**'
- 'configs/**'
- 'tools/**'
workflow_dispatch:
schedule:
- cron: '56 0 * * *'
concurrency:
group: ${{ github.workflow }}-${{ github.ref }}
cancel-in-progress: true
jobs:
test_run:
runs-on: self-hosted
timeout-minutes: 20
strategy:
matrix:
python-version: ['3.10']
steps:
- name: Clone repository
uses: actions/checkout@v2
- name: Prepare - Clone Conde Env install and copy data
run: |
eval "$(conda shell.bash hook)"
conda create --name opencompass_regression --clone opencompass_base
conda activate opencompass_regression
python3 -m pip install -e .
cp -r /cpfs01/user/qa-llm-cicd/data .
rm -rf ~/.cache/huggingface/hub -f && mkdir ~/.cache -p && mkdir ~/.cache/huggingface -p
ln -s /cpfs01/shared/public/public_hdd/llmeval/model_weights/hf_hub ~/.cache/huggingface/hub
conda info --envs
- name: Run test
run: |
eval "$(conda shell.bash hook)"
conda activate opencompass_regression
conda info --envs
rm -rf regression_result
python3 run.py --models hf_internlm_chat_7b --datasets siqa_gen --work-dir regression_result --debug
- name: Remove Conda Env
run: |
eval "$(conda shell.bash hook)"
conda env remove --name opencompass_regression
conda info --envs
- name: Get result
run: |
score=$(sed -n '$p' regression_result/*/summary/*.csv | awk -F ',' '{print $NF}')
if (( ${score%.*} >= 70 && ${score%.*} <= 80 )); then
echo "score is $score between 70 and 80"
else
echo "score is $score not between 70 and 80"
exit 1
fi
rm -rf regression_result