返回模型
说明文档

from tokenizers import Tokenizer
import onnxruntime as ort
import numpy as np

reranker_tokenizer = Tokenizer.from_file('./tokenizer.json')
reranker_session = ort.InferenceSession('./model.onnx')

def rerank(question, passages, normalize_scores=True):
    # 格式化输入模板
    templates = [f\"Query: {question}\nSentence: {passage}\" for passage in passages]
    encoded_inputs = reranker_tokenizer.encode_batch(templates)

    # 转换为列表并将序列截断到最大长度（32768）
    input_ids = [enc.ids[:32768] for enc in encoded_inputs]  # 在此处截断
    attention_mask = [[1] * len(ids) for ids in input_ids]

    # 找到批次中的最大长度
    batch_max_length = max(len(ids) for ids in input_ids)  # 已截断至 <=512

    # 填充序列
    def pad_sequence(seq, pad_value=0):
        return seq + [pad_value] * (batch_max_length - len(seq))

    input_ids = np.array([pad_sequence(ids) for ids in input_ids], dtype=np.int64)
    attention_mask = np.array([pad_sequence(mask, pad_value=0) for mask in attention_mask], dtype=np.int64)

    # 创建ONNX输入字典
    inputs_onnx = {
        \"input_ids\": input_ids,
        \"attention_mask\": attention_mask
    }

    # 运行ONNX模型
    outputs = reranker_session.run(None, inputs_onnx)
    logits = outputs[0]

    # 应用softmax获取概率
    probabilities = np.exp(logits) / np.sum(np.exp(logits), axis=1, keepdims=True)

    # 获取预测类别和置信度分数
    predicted_classes = np.argmax(probabilities, axis=1).tolist()
    confidences = np.max(probabilities, axis=1).tolist()

    results = [
        {\"passage\": passage, \"prediction\": pred, \"confidence\": conf}
        for passage, pred, conf in zip(passages, predicted_classes, confidences)
    ]

    final_results = []
    for document, result in zip(passages, results):
        # 如果预测结果为0，调整置信度分数
        if result['prediction'] == 0:
            result['confidence'] = 1 - result['confidence']
        final_results.append((document, result['confidence']))
    
    # 按置信度分数降序排序
    sorted_results = sorted(final_results, key=lambda x: x[1], reverse=True)

    # 如果需要，对分数进行归一化
    if normalize_scores:
        total_score = sum(result[1] for result in sorted_results)
        if total_score > 0:
            sorted_results = [(result[0], result[1] / total_score) for result in sorted_results]

    return sorted_results

question = \"O que é o Pantanal?\"
passages = [
    \"É um dos ecossistemas mais ricos em biodiversidade do mundo, abrigando uma grande variedade de espécies animais e vegetais.\",
    \"Sua beleza natural, com rios e lagos interligados, atrai turistas de todo o mundo.\",
    \"O Pantanal sofre com impactos ambientais, como a exploração mineral e o desmatamento.\",
    \"O Pantanal é uma extensa planície alagável localizada na América do Sul, principalmente no Brasil, mas também em partes da Bolívia e Paraguai.\",
    \"É um local com importância histórica e cultural para as populações locais.\",
    \"O Pantanal é um importante habitat para diversas espécies de animais, inclusive aves migratórias.\"
]
ranked_results = rerank(question, passages, normalize_scores=True)
ranked_results
# [('O Pantanal é uma extensa planície alagável localizada na América do Sul, principalmente no Brasil, mas também em partes da Bolívia e Paraguai.',
#   0.7105862286443647),
#  ('O Pantanal é um importante habitat para diversas espécies de animais, inclusive aves migratórias.',
#   0.22660008031497725),
#  ('O Pantanal sofre com impactos ambientais, como a exploração mineral e o desmatamento.',
#   0.043374300040060654),
#  ('É um local com importância histórica e cultural para as populações locais.',
#   0.0070428120274147726),
#  ('É um dos ecossistemas mais ricos em biodiversidade do mundo, abrigando uma grande variedade de espécies animais e vegetais.',
#   0.006359544027065005),
#  ('Sua beleza natural, com rios e lagos interligados, atrai turistas de todo o mundo.',
#   0.006037034946117598)]

question = \"What is the speed of light?\"
passages = [
    \"Isaac Newton's laws of motion and gravity laid the groundwork for classical mechanics.\",
    \"The theory of relativity, proposed by Albert Einstein, has revolutionized our understanding of space, time, and gravity.\",
    \"The Earth orbits the Sun at an average distance of about 93 million miles, taking roughly 365.25 days to complete one revolution.\",
    \"The speed of light in a vacuum is approximately 299,792 kilometers per second (km/s), or about 186,282 miles per second.\",
    \"Light can be described as both a wave and a particle, a concept known as wave-particle duality.\"
]
ranked_results = rerank(question, passages, normalize_scores=True)
ranked_results
# [('The speed of light in a vacuum is approximately 299,792 kilometers per second (km/s), or about 186,282 miles per second.',
#   0.5686758878772575),
#  ('The theory of relativity, proposed by Albert Einstein, has revolutionized our understanding of space, time, and gravity.',
#   0.14584055128478327),
#  ('The Earth orbits the Sun at an average distance of about 93 million miles, taking roughly 365.25 days to complete one revolution.',
#   0.13790743024424898),
#  (\"Isaac Newton's laws of motion and gravity laid the groundwork for classical mechanics.\",
#   0.08071345159269593),
#  ('Light can be described as both a wave and a particle, a concept known as wave-particle duality.',
#   0.06686267900101434)]
cnmoro/TangledLlama33m-Reranker-EnPt-ONNX

作者 cnmoro
text-ranking sentence-transformers
↓ 0 ♥ 0
创建时间: 2025-03-11 13:37:54+00:00
更新时间: 2025-04-02 14:30:20+00:00
在 Hugging Face 上查看
文件 (12)

.gitattributes
README.md
model.onnx ONNX
model_bnb4.onnx ONNX
model_fp16.onnx ONNX
model_int8.onnx ONNX
model_q4.onnx ONNX
model_q4f16.onnx ONNX
model_quantized.onnx ONNX
model_uint8.onnx ONNX
quantize_config.json
tokenizer.json