ONNX 模型库
返回模型列表

暂无说明文档

onnxruntime/Gemma-3-ONNX

作者 onnxruntime

下载量: 90 · 点赞: 2

创建时间: 2025-04-18 22:43:50+00:00

更新时间: 2026-02-11 00:11:49+00:00

在 Hugging Face 上查看

文件 (117)

.gitattributes
README.md
config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
onnx/12b/config.json
onnx/27b/config.json
onnx/4b/config.json
onnx/builder.py
onnx/configuration_gemma3.py
onnx/modeling_gemma3.py