gemma3 quantization (#9776)

This commit is contained in:
Patrick Devine
2025-03-14 17:41:07 -07:00
committed by GitHub
parent 2d2247e59e
commit ef378ad673
5 changed files with 149 additions and 0 deletions

View File

@@ -41,6 +41,7 @@ enum llm_arch {
LLM_ARCH_MINICPM3,
LLM_ARCH_GEMMA,
LLM_ARCH_GEMMA2,
LLM_ARCH_GEMMA3,
LLM_ARCH_STARCODER2,
LLM_ARCH_MAMBA,
LLM_ARCH_XVERSE,