返回模型
说明文档
本仓库为实验模型,相关项目:https://github.com/deepghs/tagger_embedding_aligner
import numpy as np
from imgutils.tagging import get_wd14_tags, convert_wd14_emb_to_prediction, denormalize_wd14_emb
# Example: recover usable tagger predictions from a normalized embedding.
# Request the raw embedding together with the three prediction groups.
raw_embedding, (ref_rating, ref_general, ref_character) = get_wd14_tags(
    '/my/image.png',
    fmt=('embedding', ('rating', 'general', 'character')),
)

# Reference tagging results obtained directly from the tagger call.
print('预期结果:')
for ref_part in (ref_rating, ref_general, ref_character):
    print(ref_part)

# Normalize the embedding by dividing it by its norm.
embedding_norm = np.linalg.norm(raw_embedding)
normalized_embedding = raw_embedding / embedding_norm

# Decoding the normalized embedding directly gives wrong tagging results.
bad_rating, bad_general, bad_character = convert_wd14_emb_to_prediction(
    normalized_embedding
)
print('由于嵌入归一化导致的错误结果:')
for bad_part in (bad_rating, bad_general, bad_character):
    print(bad_part)

# Denormalize the normalized embedding.
restored_embedding = denormalize_wd14_emb(normalized_embedding)
print(restored_embedding.shape)

# These should be close to the reference results, with an error of
# roughly 1e-3.
restored_rating, restored_general, restored_character = (
    convert_wd14_emb_to_prediction(restored_embedding)
)
print('反归一化结果:')
for restored_part in (restored_rating, restored_general, restored_character):
    print(restored_part)
| 名称 | 标签器 | 嵌入维度 | 标签数量 | FLOPS | 参数量 | 嵌入余弦相似度 | 嵌入范数 | 预测损失 | 预测均方误差 |
|---|---|---|---|---|---|---|---|---|---|
| ViT_v3_mnum2_all | ViT_v3 | 768 | 10861 | 0.000398G | 0.40M | 1 | 0.1712 | 0.004306 | 2.116e-08 |
| ViT_v3_mnum1_all | ViT_v3 | 768 | 10861 | 0.000709G | 0.71M | 1 | 0.2246 | 0.004306 | 3.991e-08 |
| ConvNext_v3_mnum2_all | ConvNext_v3 | 1024 | 10861 | 0.000708G | 0.71M | 1 | 0.1126 | 0.004531 | 2.061e-08 |
| ConvNext_v3_mnum1_all | ConvNext_v3 | 1024 | 10861 | 0.001260G | 1.26M | 1 | 0.1473 | 0.004531 | 3.539e-08 |
| ViT_mnum2_all | ViT | 768 | 9083 | 0.000398G | 0.40M | 1 | 0.08641 | 0.005199 | 3.797e-09 |
| ViT_mnum1_all | ViT | 768 | 9083 | 0.000709G | 0.71M | 1 | 0.1724 | 0.005199 | 1.896e-08 |
| ConvNext_mnum2_all | ConvNext | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.05776 | 0.005213 | 7.207e-09 |
| ConvNext_mnum1_all | ConvNext | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.07134 | 0.005214 | 1.292e-08 |
| ViT_Large_mnum2_all | ViT_Large | 1024 | 10861 | 0.000708G | 0.71M | 1 | 1.403 | 0.003966 | 1.617e-07 |
| ViT_Large_mnum1_all | ViT_Large | 1024 | 10861 | 0.001260G | 1.26M | 1 | 1.643 | 0.003966 | 2.24e-07 |
| SwinV2_mnum2_all | SwinV2 | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.1257 | 0.004726 | 3.797e-08 |
| SwinV2_mnum1_all | SwinV2 | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.1497 | 0.004727 | 5.487e-08 |
| EVA02_Large_mnum2_all | EVA02_Large | 1024 | 10861 | 0.000708G | 0.71M | 1 | 1.268 | 0.005948 | 5.466e-08 |
| EVA02_Large_mnum1_all | EVA02_Large | 1024 | 10861 | 0.001260G | 1.26M | 1 | 1.713 | 0.005948 | 9.518e-08 |
| ConvNextV2_mnum2_all | ConvNextV2 | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.09014 | 0.004596 | 1.43e-08 |
| ConvNextV2_mnum1_all | ConvNextV2 | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.1216 | 0.004596 | 2.76e-08 |
| SwinV2_v3_mnum2_all | SwinV2_v3 | 1024 | 10861 | 0.000708G | 0.71M | 1 | 0.2129 | 0.004128 | 4.035e-08 |
| SwinV2_v3_mnum1_all | SwinV2_v3 | 1024 | 10861 | 0.001260G | 1.26M | 1 | 0.2784 | 0.004129 | 6.893e-08 |
| MOAT_mnum2_all | MOAT | 1024 | 9083 | 0.000708G | 0.71M | 1 | 0.4662 | 0.004998 | 1.855e-08 |
| MOAT_mnum1_all | MOAT | 1024 | 9083 | 0.001260G | 1.26M | 1 | 0.7849 | 0.004998 | 5.549e-08 |
deepghs/wd14_tagger_embedding_denormalize
作者 deepghs
feature-extraction
dghs-imgutils
↓ 0
♥ 2
创建时间: 2024-11-12 05:39:10+00:00
更新时间: 2024-11-30 08:42:52+00:00
在 Hugging Face 上查看文件 (122)
.gitattributes
ConvNextV2_mnum1_all/events.out.tfevents.1731467912.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.4
ConvNextV2_mnum1_all/metrics.json
ConvNextV2_mnum1_all/model.json
ConvNextV2_mnum1_all/model.onnx
ONNX
ConvNextV2_mnum1_all/model.pt
ConvNextV2_mnum1_all/model_with_fc.onnx
ONNX
ConvNextV2_mnum2_all/events.out.tfevents.1731458536.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.3
ConvNextV2_mnum2_all/metrics.json
ConvNextV2_mnum2_all/model.json
ConvNextV2_mnum2_all/model.onnx
ONNX
ConvNextV2_mnum2_all/model.pt
ConvNextV2_mnum2_all/model_with_fc.onnx
ONNX
ConvNext_mnum1_all/events.out.tfevents.1731486633.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.1
ConvNext_mnum1_all/metrics.json
ConvNext_mnum1_all/model.json
ConvNext_mnum1_all/model.onnx
ONNX
ConvNext_mnum1_all/model.pt
ConvNext_mnum1_all/model_with_fc.onnx
ONNX
ConvNext_mnum2_all/events.out.tfevents.1731477314.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.0
ConvNext_mnum2_all/metrics.json
ConvNext_mnum2_all/model.json
ConvNext_mnum2_all/model.onnx
ONNX
ConvNext_mnum2_all/model.pt
ConvNext_mnum2_all/model_with_fc.onnx
ONNX
ConvNext_v3_mnum1_all/events.out.tfevents.1731524250.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.5
ConvNext_v3_mnum1_all/metrics.json
ConvNext_v3_mnum1_all/model.json
ConvNext_v3_mnum1_all/model.onnx
ONNX
ConvNext_v3_mnum1_all/model.pt
ConvNext_v3_mnum1_all/model_with_fc.onnx
ONNX
ConvNext_v3_mnum2_all/events.out.tfevents.1731513240.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.4
ConvNext_v3_mnum2_all/metrics.json
ConvNext_v3_mnum2_all/model.json
ConvNext_v3_mnum2_all/model.onnx
ONNX
ConvNext_v3_mnum2_all/model.pt
ConvNext_v3_mnum2_all/model_with_fc.onnx
ONNX
EVA02_Large_mnum1_all/events.out.tfevents.1731406771.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.1
EVA02_Large_mnum1_all/metrics.json
EVA02_Large_mnum1_all/model.json
EVA02_Large_mnum1_all/model.onnx
ONNX
EVA02_Large_mnum1_all/model.pt
EVA02_Large_mnum1_all/model_with_fc.onnx
ONNX
EVA02_Large_mnum2_all/events.out.tfevents.1731396120.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.0
EVA02_Large_mnum2_all/metrics.json
EVA02_Large_mnum2_all/model.json
EVA02_Large_mnum2_all/model.onnx
ONNX
EVA02_Large_mnum2_all/model.pt
EVA02_Large_mnum2_all/model_with_fc.onnx
ONNX
MOAT_mnum1_all/events.out.tfevents.1731368146.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.2
MOAT_mnum1_all/metrics.json
MOAT_mnum1_all/model.json
MOAT_mnum1_all/model.onnx
ONNX
MOAT_mnum1_all/model.pt
MOAT_mnum1_all/model_with_fc.onnx
ONNX
MOAT_mnum2_all/events.out.tfevents.1731377678.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.3
MOAT_mnum2_all/metrics.json
MOAT_mnum2_all/model.json
MOAT_mnum2_all/model.onnx
ONNX
MOAT_mnum2_all/model.pt
MOAT_mnum2_all/model_with_fc.onnx
ONNX
README.md
SwinV2_mnum1_all/events.out.tfevents.1731449244.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.2
SwinV2_mnum1_all/metrics.json
SwinV2_mnum1_all/model.json
SwinV2_mnum1_all/model.onnx
ONNX
SwinV2_mnum1_all/model.pt
SwinV2_mnum1_all/model_with_fc.onnx
ONNX
SwinV2_mnum2_all/events.out.tfevents.1731439996.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.1
SwinV2_mnum2_all/metrics.json
SwinV2_mnum2_all/model.json
SwinV2_mnum2_all/model.onnx
ONNX
SwinV2_mnum2_all/model.pt
SwinV2_mnum2_all/model_with_fc.onnx
ONNX
SwinV2_v3_mnum1_all/events.out.tfevents.1731346980.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.0
SwinV2_v3_mnum1_all/metrics.json
SwinV2_v3_mnum1_all/model.json
SwinV2_v3_mnum1_all/model.onnx
ONNX
SwinV2_v3_mnum1_all/model.pt
SwinV2_v3_mnum1_all/model_with_fc.onnx
ONNX
SwinV2_v3_mnum2_all/events.out.tfevents.1731357825.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.1224206.1
SwinV2_v3_mnum2_all/metrics.json
SwinV2_v3_mnum2_all/model.json
SwinV2_v3_mnum2_all/model.onnx
ONNX
SwinV2_v3_mnum2_all/model.pt
SwinV2_v3_mnum2_all/model_with_fc.onnx
ONNX
ViT_Large_mnum1_all/events.out.tfevents.1731429112.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.3434049.0
ViT_Large_mnum1_all/metrics.json
ViT_Large_mnum1_all/model.json
ViT_Large_mnum1_all/model.onnx
ONNX
ViT_Large_mnum1_all/model.pt
ViT_Large_mnum1_all/model_with_fc.onnx
ONNX
ViT_Large_mnum2_all/events.out.tfevents.1731416951.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.2486943.2
ViT_Large_mnum2_all/metrics.json
ViT_Large_mnum2_all/model.json
ViT_Large_mnum2_all/model.onnx
ONNX
ViT_Large_mnum2_all/model.pt
ViT_Large_mnum2_all/model_with_fc.onnx
ONNX
ViT_mnum1_all/events.out.tfevents.1731504468.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.3
ViT_mnum1_all/metrics.json
ViT_mnum1_all/model.json
ViT_mnum1_all/model.onnx
ONNX
ViT_mnum1_all/model.pt
ViT_mnum1_all/model_with_fc.onnx
ONNX
ViT_mnum2_all/events.out.tfevents.1731495691.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.2
ViT_mnum2_all/metrics.json
ViT_mnum2_all/model.json
ViT_mnum2_all/model.onnx
ONNX
ViT_mnum2_all/model.pt
ViT_mnum2_all/model_with_fc.onnx
ONNX
ViT_v3_mnum1_all/events.out.tfevents.1731545594.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.7
ViT_v3_mnum1_all/metrics.json
ViT_v3_mnum1_all/model.json
ViT_v3_mnum1_all/model.onnx
ONNX
ViT_v3_mnum1_all/model.pt
ViT_v3_mnum1_all/model_with_fc.onnx
ONNX
ViT_v3_mnum2_all/events.out.tfevents.1731534803.99115a8e0b9f5c8a69fc2f5fa0161c8670a7b68fb92c149a211a0a72.756977.6
ViT_v3_mnum2_all/metrics.json
ViT_v3_mnum2_all/model.json
ViT_v3_mnum2_all/model.onnx
ONNX
ViT_v3_mnum2_all/model.pt
ViT_v3_mnum2_all/model_with_fc.onnx
ONNX