返回模型
暂无说明文档
onnxruntime/Gemma-3-ONNX
作者 onnxruntime
↓ 90
♥ 2
创建时间: 2025-04-18 22:43:50+00:00
更新时间: 2026-02-11 00:11:49+00:00
在 Hugging Face 上查看文件 (117)
.gitattributes
README.md
config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx
ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx
ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx
ONNX
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-12b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-12b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-12b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx
ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx
ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx
ONNX
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-27b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-27b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-27b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/chat_template.jinja
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx
ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-embedding.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx
ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-text.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx
ONNX
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/gemma-3-vision.onnx.data
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/processor_config.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
gemma-3-4b-it/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/genai_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/processor_config.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer.json
gemma-3-4b-it/gpu/cuda-bf16-io-int4-rtn-block-32/tokenizer_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/chat_template.jinja
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx
ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-embedding.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx
ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-text.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx
ONNX
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/gemma-3-vision.onnx.data
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/genai_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/processor_config.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/special_tokens_map.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer.json
gemma-3-4b-it/gpu/gpu-fp16-io-int4-rtn-block-32/tokenizer_config.json
onnx/12b/config.json
onnx/27b/config.json
onnx/4b/config.json
onnx/builder.py
onnx/configuration_gemma3.py
onnx/modeling_gemma3.py