mirror of
https://github.com/dogkeeper886/ollama37.git
synced 2025-12-22 13:46:59 +00:00
Change workflow defaults: judge_mode=dual, judge_model=gemma3:12b
This commit is contained in:
40
.github/workflows/build.yml
vendored
40
.github/workflows/build.yml
vendored
@@ -1,33 +1,33 @@
|
||||
name: Build Verification
|
||||
|
||||
on:
|
||||
workflow_dispatch: # Manual trigger
|
||||
workflow_dispatch: # Manual trigger
|
||||
inputs:
|
||||
judge_mode:
|
||||
description: 'Test judge mode'
|
||||
description: "Test judge mode"
|
||||
required: false
|
||||
default: 'simple'
|
||||
default: "dual"
|
||||
type: choice
|
||||
options:
|
||||
- 'simple'
|
||||
- 'llm'
|
||||
- 'dual'
|
||||
- "simple"
|
||||
- "llm"
|
||||
- "dual"
|
||||
judge_model:
|
||||
description: 'LLM model for judging (if llm/dual mode)'
|
||||
description: "LLM model for judging (if llm/dual mode)"
|
||||
required: false
|
||||
default: 'gemma3:4b'
|
||||
default: "gemma3:12b"
|
||||
type: string
|
||||
workflow_call: # Called by other workflows
|
||||
workflow_call: # Called by other workflows
|
||||
inputs:
|
||||
judge_mode:
|
||||
description: 'Test judge mode (simple, llm, dual)'
|
||||
description: "Test judge mode (simple, llm, dual)"
|
||||
required: false
|
||||
default: 'simple'
|
||||
default: "dual"
|
||||
type: string
|
||||
judge_model:
|
||||
description: 'LLM model for judging'
|
||||
description: "LLM model for judging"
|
||||
required: false
|
||||
default: 'gemma3:4b'
|
||||
default: "gemma3:12b"
|
||||
type: string
|
||||
outputs:
|
||||
result:
|
||||
@@ -51,7 +51,7 @@ jobs:
|
||||
- name: Setup Node.js
|
||||
uses: actions/setup-node@v4
|
||||
with:
|
||||
node-version: '20'
|
||||
node-version: "20"
|
||||
|
||||
- name: Install test runner dependencies
|
||||
run: cd tests && npm ci
|
||||
@@ -63,16 +63,16 @@ jobs:
|
||||
|
||||
# Build judge flags based on input
|
||||
JUDGE_FLAGS=""
|
||||
if [ "${{ inputs.judge_mode }}" = "simple" ] || [ -z "${{ inputs.judge_mode }}" ]; then
|
||||
if [ "${{ inputs.judge_mode }}" = "simple" ]; then
|
||||
JUDGE_FLAGS="--no-llm"
|
||||
elif [ "${{ inputs.judge_mode }}" = "dual" ]; then
|
||||
JUDGE_FLAGS="--dual-judge --judge-model ${{ inputs.judge_model || 'gemma3:4b' }}"
|
||||
elif [ "${{ inputs.judge_mode }}" = "llm" ]; then
|
||||
JUDGE_FLAGS="--judge-model ${{ inputs.judge_model || 'gemma3:12b' }}"
|
||||
else
|
||||
# llm mode
|
||||
JUDGE_FLAGS="--judge-model ${{ inputs.judge_model || 'gemma3:4b' }}"
|
||||
# dual mode (default)
|
||||
JUDGE_FLAGS="--dual-judge --judge-model ${{ inputs.judge_model || 'gemma3:12b' }}"
|
||||
fi
|
||||
|
||||
echo "Judge mode: ${{ inputs.judge_mode || 'simple' }}"
|
||||
echo "Judge mode: ${{ inputs.judge_mode || 'dual' }}"
|
||||
echo "Judge flags: $JUDGE_FLAGS"
|
||||
|
||||
# Progress goes to stderr (visible), JSON results go to file
|
||||
|
||||
Reference in New Issue
Block a user