ONNX 模型库
返回模型

说明文档

实验模型:https://github.com/deepghs/tagger_embedding_aligner

import numpy as np

from imgutils.tagging import get_wd14_tags, convert_wd14_emb_to_prediction, denormalize_wd14_emb

# Tag the image once, asking for the embedding together with the
# rating / general / character predictions.
raw_embedding, (ref_rating, ref_general, ref_character) = get_wd14_tags(
    '/my/image.png',
    fmt=('embedding', ('rating', 'general', 'character')),
)

# Reference output: the normal tagging results.
print('预期结果:')
print(ref_rating, ref_general, ref_character, sep='\n')

# Normalize the embedding by dividing it by its norm.
unit_embedding = raw_embedding / np.linalg.norm(raw_embedding)

# Predicting straight from the normalized embedding gives wrong tagging results.
bad_rating, bad_general, bad_character = convert_wd14_emb_to_prediction(unit_embedding)
print('由于嵌入归一化导致的错误结果:')
print(bad_rating, bad_general, bad_character, sep='\n')

# Denormalize the normalized embedding.
restored_embedding = denormalize_wd14_emb(unit_embedding)
print(restored_embedding.shape)

# These should be close to ref_rating, ref_general, ref_character
# (error of roughly 1e-3).
rating, general, character = convert_wd14_emb_to_prediction(restored_embedding)
print('反归一化结果:')
print(rating, general, character, sep='\n')
| 名称 | 标签器 | 嵌入维度 | 标签数量 | FLOPS | 参数量 | 嵌入余弦相似度 | 嵌入范数 | 预测损失 | 预测均方误差 |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| ViT_v3_mnum2_all | ViT_v3 | 768 | 10861 | 0.000398G | 0.40M | 1 | 0.1712 | 0.004306 | 2.116e-08 |
| ViT_v3_mnum1_all | ViT_v3 | 768 | 10861 | 0.000709G | 0.71M | 1 | 0.2246 | 0.004306 | 3.991e-08 |
| ConvNext_v3_mnum2_all | ConvNext_v3 | 1024 | 10861 | 0.000708G | 0.71M | 1 | 0.1126 | 0.004531 | 2.061e-08 |
| ConvNext_v3_mnum1_all | ConvNext_v3 | 1024 | 10861 | 0.001260G | 1.26M | 1 | 0.1473 | 0.004531 | 3.539e-08 |
| ViT_mnum2_all | ViT | 768 | 9083 | 0.000398G | 0.40M | 1 | 0.08641 | 0.005199 | 3.797e-09 |
| ViT_mnum1_all | ViT | 768 | 9083 | 0.000709G | 0.71M | 1 | 0.1724 | 0.005199 | 1.896e-08 |
| ConvNext_mnum2_all | ConvNext | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.05776 | 0.005213 | 7.207e-09 |
| ConvNext_mnum1_all | ConvNext | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.07134 | 0.005214 | 1.292e-08 |
| ViT_Large_mnum2_all | ViT_Large | 1024 | 10861 | 0.000708G | 0.71M | 1 | 1.403 | 0.003966 | 1.617e-07 |
| ViT_Large_mnum1_all | ViT_Large | 1024 | 10861 | 0.001260G | 1.26M | 1 | 1.643 | 0.003966 | 2.24e-07 |
| SwinV2_mnum2_all | SwinV2 | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.1257 | 0.004726 | 3.797e-08 |
| SwinV2_mnum1_all | SwinV2 | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.1497 | 0.004727 | 5.487e-08 |
| EVA02_Large_mnum2_all | EVA02_Large | 1024 | 10861 | 0.000708G | 0.71M | 1 | 1.268 | 0.005948 | 5.466e-08 |
| EVA02_Large_mnum1_all | EVA02_Large | 1024 | 10861 | 0.001260G | 1.26M | 1 | 1.713 | 0.005948 | 9.518e-08 |
| ConvNextV2_mnum2_all | ConvNextV2 | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.09014 | 0.004596 | 1.43e-08 |
| ConvNextV2_mnum1_all | ConvNextV2 | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.1216 | 0.004596 | 2.76e-08 |
| SwinV2_v3_mnum2_all | SwinV2_v3 | 1024 | 10861 | 0.000708G | 0.71M | 1 | 0.2129 | 0.004128 | 4.035e-08 |
| SwinV2_v3_mnum1_all | SwinV2_v3 | 1024 | 10861 | 0.001260G | 1.26M | 1 | 0.2784 | 0.004129 | 6.893e-08 |
| MOAT_mnum2_all | MOAT | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.4662 | 0.004998 | 1.855e-08 |
| MOAT_mnum1_all | MOAT | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.7849 | 0.004998 | 5.549e-08 |

deepghs/wd14_tagger_embedding_denormalize

作者 deepghs

feature-extraction dghs-imgutils
↓ 0 ♥ 2

创建时间: 2024-11-12 05:39:10+00:00

更新时间: 2024-11-30 08:42:52+00:00

在 Hugging Face 上查看

文件 (122)

.gitattributes
ConvNextV2_mnum1_all/events.out.tfevents.1731467912.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.4
ConvNextV2_mnum1_all/metrics.json
ConvNextV2_mnum1_all/model.json
ConvNextV2_mnum1_all/model.onnx ONNX
ConvNextV2_mnum1_all/model.pt
ConvNextV2_mnum1_all/model_with_fc.onnx ONNX
ConvNextV2_mnum2_all/events.out.tfevents.1731458536.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.3
ConvNextV2_mnum2_all/metrics.json
ConvNextV2_mnum2_all/model.json
ConvNextV2_mnum2_all/model.onnx ONNX
ConvNextV2_mnum2_all/model.pt
ConvNextV2_mnum2_all/model_with_fc.onnx ONNX
ConvNext_mnum1_all/events.out.tfevents.1731486633.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.1
ConvNext_mnum1_all/metrics.json
ConvNext_mnum1_all/model.json
ConvNext_mnum1_all/model.onnx ONNX
ConvNext_mnum1_all/model.pt
ConvNext_mnum1_all/model_with_fc.onnx ONNX
ConvNext_mnum2_all/events.out.tfevents.1731477314.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.0
ConvNext_mnum2_all/metrics.json
ConvNext_mnum2_all/model.json
ConvNext_mnum2_all/model.onnx ONNX
ConvNext_mnum2_all/model.pt
ConvNext_mnum2_all/model_with_fc.onnx ONNX
ConvNext_v3_mnum1_all/events.out.tfevents.1731524250.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.5
ConvNext_v3_mnum1_all/metrics.json
ConvNext_v3_mnum1_all/model.json
ConvNext_v3_mnum1_all/model.onnx ONNX
ConvNext_v3_mnum1_all/model.pt
ConvNext_v3_mnum1_all/model_with_fc.onnx ONNX
ConvNext_v3_mnum2_all/events.out.tfevents.1731513240.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.4
ConvNext_v3_mnum2_all/metrics.json
ConvNext_v3_mnum2_all/model.json
ConvNext_v3_mnum2_all/model.onnx ONNX
ConvNext_v3_mnum2_all/model.pt
ConvNext_v3_mnum2_all/model_with_fc.onnx ONNX
EVA02_Large_mnum1_all/events.out.tfevents.1731406771.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.1
EVA02_Large_mnum1_all/metrics.json
EVA02_Large_mnum1_all/model.json
EVA02_Large_mnum1_all/model.onnx ONNX
EVA02_Large_mnum1_all/model.pt
EVA02_Large_mnum1_all/model_with_fc.onnx ONNX
EVA02_Large_mnum2_all/events.out.tfevents.1731396120.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.0
EVA02_Large_mnum2_all/metrics.json
EVA02_Large_mnum2_all/model.json
EVA02_Large_mnum2_all/model.onnx ONNX
EVA02_Large_mnum2_all/model.pt
EVA02_Large_mnum2_all/model_with_fc.onnx ONNX
MOAT_mnum1_all/events.out.tfevents.1731368146.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.2
MOAT_mnum1_all/metrics.json
MOAT_mnum1_all/model.json
MOAT_mnum1_all/model.onnx ONNX
MOAT_mnum1_all/model.pt
MOAT_mnum1_all/model_with_fc.onnx ONNX
MOAT_mnum2_all/events.out.tfevents.1731377678.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.3
MOAT_mnum2_all/metrics.json
MOAT_mnum2_all/model.json
MOAT_mnum2_all/model.onnx ONNX
MOAT_mnum2_all/model.pt
MOAT_mnum2_all/model_with_fc.onnx ONNX
README.md
SwinV2_mnum1_all/events.out.tfevents.1731449244.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.2
SwinV2_mnum1_all/metrics.json
SwinV2_mnum1_all/model.json
SwinV2_mnum1_all/model.onnx ONNX
SwinV2_mnum1_all/model.pt
SwinV2_mnum1_all/model_with_fc.onnx ONNX
SwinV2_mnum2_all/events.out.tfevents.1731439996.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.1
SwinV2_mnum2_all/metrics.json
SwinV2_mnum2_all/model.json
SwinV2_mnum2_all/model.onnx ONNX
SwinV2_mnum2_all/model.pt
SwinV2_mnum2_all/model_with_fc.onnx ONNX
SwinV2_v3_mnum1_all/events.out.tfevents.1731346980.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.0
SwinV2_v3_mnum1_all/metrics.json
SwinV2_v3_mnum1_all/model.json
SwinV2_v3_mnum1_all/model.onnx ONNX
SwinV2_v3_mnum1_all/model.pt
SwinV2_v3_mnum1_all/model_with_fc.onnx ONNX
SwinV2_v3_mnum2_all/events.out.tfevents.1731357825.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.1
SwinV2_v3_mnum2_all/metrics.json
SwinV2_v3_mnum2_all/model.json
SwinV2_v3_mnum2_all/model.onnx ONNX
SwinV2_v3_mnum2_all/model.pt
SwinV2_v3_mnum2_all/model_with_fc.onnx ONNX
ViT_Large_mnum1_all/events.out.tfevents.1731429112.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.0
ViT_Large_mnum1_all/metrics.json
ViT_Large_mnum1_all/model.json
ViT_Large_mnum1_all/model.onnx ONNX
ViT_Large_mnum1_all/model.pt
ViT_Large_mnum1_all/model_with_fc.onnx ONNX
ViT_Large_mnum2_all/events.out.tfevents.1731416951.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.2
ViT_Large_mnum2_all/metrics.json
ViT_Large_mnum2_all/model.json
ViT_Large_mnum2_all/model.onnx ONNX
ViT_Large_mnum2_all/model.pt
ViT_Large_mnum2_all/model_with_fc.onnx ONNX
ViT_mnum1_all/events.out.tfevents.1731504468.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.3
ViT_mnum1_all/metrics.json
ViT_mnum1_all/model.json
ViT_mnum1_all/model.onnx ONNX
ViT_mnum1_all/model.pt
ViT_mnum1_all/model_with_fc.onnx ONNX
ViT_mnum2_all/events.out.tfevents.1731495691.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.2
ViT_mnum2_all/metrics.json
ViT_mnum2_all/model.json
ViT_mnum2_all/model.onnx ONNX
ViT_mnum2_all/model.pt
ViT_mnum2_all/model_with_fc.onnx ONNX
ViT_v3_mnum1_all/events.out.tfevents.1731545594.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.7
ViT_v3_mnum1_all/metrics.json
ViT_v3_mnum1_all/model.json
ViT_v3_mnum1_all/model.onnx ONNX
ViT_v3_mnum1_all/model.pt
ViT_v3_mnum1_all/model_with_fc.onnx ONNX
ViT_v3_mnum2_all/events.out.tfevents.1731534803.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.6
ViT_v3_mnum2_all/metrics.json
ViT_v3_mnum2_all/model.json
ViT_v3_mnum2_all/model.onnx ONNX
ViT_v3_mnum2_all/model.pt
ViT_v3_mnum2_all/model_with_fc.onnx ONNX