mirror of
https://github.com/dogkeeper886/ollama37.git
synced 2025-12-22 05:37:01 +00:00
Change workflow defaults: judge_mode=dual, judge_model=gemma3:12b
This commit is contained in:
50
.github/workflows/runtime.yml
vendored
50
.github/workflows/runtime.yml
vendored
@@ -1,46 +1,46 @@
|
||||
name: Runtime Tests
|
||||
|
||||
on:
|
||||
workflow_dispatch: # Manual trigger
|
||||
workflow_dispatch: # Manual trigger
|
||||
inputs:
|
||||
keep_container:
|
||||
description: 'Keep container running after tests'
|
||||
description: "Keep container running after tests"
|
||||
required: false
|
||||
default: 'false'
|
||||
default: "false"
|
||||
type: choice
|
||||
options:
|
||||
- 'true'
|
||||
- 'false'
|
||||
- "true"
|
||||
- "false"
|
||||
judge_mode:
|
||||
description: 'Test judge mode'
|
||||
description: "Test judge mode"
|
||||
required: false
|
||||
default: 'simple'
|
||||
default: "dual"
|
||||
type: choice
|
||||
options:
|
||||
- 'simple'
|
||||
- 'llm'
|
||||
- 'dual'
|
||||
- "simple"
|
||||
- "llm"
|
||||
- "dual"
|
||||
judge_model:
|
||||
description: 'LLM model for judging (if llm/dual mode)'
|
||||
description: "LLM model for judging (if llm/dual mode)"
|
||||
required: false
|
||||
default: 'gemma3:4b'
|
||||
default: "gemma3:12b"
|
||||
type: string
|
||||
workflow_call: # Called by other workflows
|
||||
workflow_call: # Called by other workflows
|
||||
inputs:
|
||||
keep_container:
|
||||
description: 'Keep container running for subsequent jobs'
|
||||
description: "Keep container running for subsequent jobs"
|
||||
required: false
|
||||
default: false
|
||||
type: boolean
|
||||
judge_mode:
|
||||
description: 'Test judge mode (simple, llm, dual)'
|
||||
description: "Test judge mode (simple, llm, dual)"
|
||||
required: false
|
||||
default: 'simple'
|
||||
default: "dual"
|
||||
type: string
|
||||
judge_model:
|
||||
description: 'LLM model for judging'
|
||||
description: "LLM model for judging"
|
||||
required: false
|
||||
default: 'gemma3:4b'
|
||||
default: "gemma3:12b"
|
||||
type: string
|
||||
outputs:
|
||||
result:
|
||||
@@ -61,7 +61,7 @@ jobs:
|
||||
- name: Setup Node.js
|
||||
uses: actions/setup-node@v4
|
||||
with:
|
||||
node-version: '20'
|
||||
node-version: "20"
|
||||
|
||||
- name: Install test runner dependencies
|
||||
run: cd tests && npm ci
|
||||
@@ -80,16 +80,16 @@ jobs:
|
||||
|
||||
# Build judge flags based on input
|
||||
JUDGE_FLAGS=""
|
||||
if [ "${{ inputs.judge_mode }}" = "simple" ] || [ -z "${{ inputs.judge_mode }}" ]; then
|
||||
if [ "${{ inputs.judge_mode }}" = "simple" ]; then
|
||||
JUDGE_FLAGS="--no-llm"
|
||||
elif [ "${{ inputs.judge_mode }}" = "dual" ]; then
|
||||
JUDGE_FLAGS="--dual-judge --judge-model ${{ inputs.judge_model || 'gemma3:4b' }}"
|
||||
elif [ "${{ inputs.judge_mode }}" = "llm" ]; then
|
||||
JUDGE_FLAGS="--judge-model ${{ inputs.judge_model || 'gemma3:12b' }}"
|
||||
else
|
||||
# llm mode
|
||||
JUDGE_FLAGS="--judge-model ${{ inputs.judge_model || 'gemma3:4b' }}"
|
||||
# dual mode (default)
|
||||
JUDGE_FLAGS="--dual-judge --judge-model ${{ inputs.judge_model || 'gemma3:12b' }}"
|
||||
fi
|
||||
|
||||
echo "Judge mode: ${{ inputs.judge_mode || 'simple' }}"
|
||||
echo "Judge mode: ${{ inputs.judge_mode || 'dual' }}"
|
||||
echo "Judge flags: $JUDGE_FLAGS"
|
||||
|
||||
# Progress goes to stderr (visible), JSON results go to file
|
||||
|
||||
Reference in New Issue
Block a user