language:
- en
tags:
- ColBERT
- PyLate
- sentence-transformers
- sentence-similarity
- feature-extraction
- generated_from_trainer
- dataset_size:640000
- loss:Distillation
base_model: NeuML/bert-hash-femto
datasets:
- lightonai/ms-marco-en-bge-gemma
pipeline_tag: sentence-similarity
library_name: PyLate
license: apache-2.0
metrics:
- MaxSim_accuracy@1
- MaxSim_accuracy@3
- MaxSim_accuracy@5
- MaxSim_accuracy@10
- MaxSim_precision@1
- MaxSim_precision@3
- MaxSim_precision@5
- MaxSim_precision@10
- MaxSim_recall@1
- MaxSim_recall@3
- MaxSim_recall@5
- MaxSim_recall@10
- MaxSim_ndcg@10
- MaxSim_mrr@10
- MaxSim_map@100
model-index:
- name: ColBERT MUVERA Femto
results:
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoClimateFEVER
type: NanoClimateFEVER
metrics:
- type: MaxSim_accuracy@1
value: 0.14
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.32
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.36
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.52
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.14
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.11333333333333333
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.07600000000000001
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.05600000000000001
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.085
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.165
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.19166666666666668
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.25233333333333335
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.19115874409066272
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.2408333333333333
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.1462389973257929
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoDBPedia
type: NanoDBPedia
metrics:
- type: MaxSim_accuracy@1
value: 0.7
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.82
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.82
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.84
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.7
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.5933333333333333
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.548
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.456
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.0728506527388449
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.13076941366456654
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.17827350013263704
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.2781635119304686
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.5510945084552747
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.7555555555555555
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.39128533545834626
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoFEVER
type: NanoFEVER
metrics:
- type: MaxSim_accuracy@1
value: 0.62
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.76
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.84
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.86
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.62
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.26666666666666666
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.184
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.09399999999999999
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.5766666666666667
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.7366666666666667
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.83
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.85
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.7249306483092258
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.6976666666666665
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.679664802101873
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoFiQA2018
type: NanoFiQA2018
metrics:
- type: MaxSim_accuracy@1
value: 0.28
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.34
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.44
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.48
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.28
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.13333333333333333
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.10800000000000001
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.062
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.13555555555555557
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.19755555555555557
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.2666349206349206
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.2994920634920635
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.2502784944505909
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.33252380952380944
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.20907273372726215
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoHotpotQA
type: NanoHotpotQA
metrics:
- type: MaxSim_accuracy@1
value: 0.76
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.84
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.9
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.92
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.76
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.36666666666666664
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.252
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.136
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.38
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.55
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.63
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.68
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.6514325561331983
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.8098333333333333
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.5738665952275315
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoMSMARCO
type: NanoMSMARCO
metrics:
- type: MaxSim_accuracy@1
value: 0.32
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.48
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.6
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.7
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.32
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.16
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.12000000000000002
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.07
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.32
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.48
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.6
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.7
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.4946222844793249
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.43052380952380953
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.4408050908765128
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoNFCorpus
type: NanoNFCorpus
metrics:
- type: MaxSim_accuracy@1
value: 0.32
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.42
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.52
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.62
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.32
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.2866666666666666
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.26799999999999996
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.21000000000000005
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.01921769353070746
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.03782391241260524
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.05411010345369293
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.09349869834347448
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.2481257474345093
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.3995793650793651
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.08737709081330662
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoNQ
type: NanoNQ
metrics:
- type: MaxSim_accuracy@1
value: 0.28
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.52
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.58
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.74
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.28
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.1733333333333333
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.12000000000000002
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.07600000000000001
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.26
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.49
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.56
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.7
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.4828411530427104
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.4289603174603174
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.41150699780701017
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoQuoraRetrieval
type: NanoQuoraRetrieval
metrics:
- type: MaxSim_accuracy@1
value: 0.74
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.84
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.88
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.9
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.74
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.30666666666666664
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.21199999999999997
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.11599999999999998
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.674
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.784
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.8413333333333333
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.8626666666666667
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.8016479127266055
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.7995238095238095
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.7733654571274
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoSCIDOCS
type: NanoSCIDOCS
metrics:
- type: MaxSim_accuracy@1
value: 0.3
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.44
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.52
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.62
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.3
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.18
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.14400000000000002
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.092
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.061000000000000006
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.11100000000000002
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.14700000000000002
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.18799999999999997
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.198564235862039
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.3978253968253968
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.13670583023266375
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoArguAna
type: NanoArguAna
metrics:
- type: MaxSim_accuracy@1
value: 0.14
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.24
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.28
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.36
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.14
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.07999999999999999
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.05600000000000001
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.036000000000000004
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.14
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.24
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.28
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.36
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.2444065884095295
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.20804761904761904
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.21989999402599436
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoSciFact
type: NanoSciFact
metrics:
- type: MaxSim_accuracy@1
value: 0.36
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.5
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.6
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.62
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.36
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.18666666666666668
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.14
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.07400000000000001
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.325
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.49
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.59
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.62
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.4856083424090788
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.44449999999999995
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.44726079800650204
name: Maxsim Map@100
- task:
type: py-late-information-retrieval
name: Py Late Information Retrieval
dataset:
name: NanoTouche2020
type: NanoTouche2020
metrics:
- type: MaxSim_accuracy@1
value: 0.6530612244897959
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.9591836734693877
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.9795918367346939
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 1
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.6530612244897959
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.6054421768707483
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.5673469387755103
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.45918367346938777
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.04308959031413618
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.11831839494199368
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.1804772716223025
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.2842813442856462
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.5191595399345652
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.8064625850340136
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.32574548665687825
name: Maxsim Map@100
- task:
type: nano-beir
name: Nano BEIR
dataset:
name: NanoBEIR mean
type: NanoBEIR_mean
metrics:
- type: MaxSim_accuracy@1
value: 0.4317739403453689
name: Maxsim Accuracy@1
- type: MaxSim_accuracy@3
value: 0.5753218210361067
name: Maxsim Accuracy@3
- type: MaxSim_accuracy@5
value: 0.6399686028257457
name: Maxsim Accuracy@5
- type: MaxSim_accuracy@10
value: 0.7061538461538461
name: Maxsim Accuracy@10
- type: MaxSim_precision@1
value: 0.4317739403453689
name: Maxsim Precision@1
- type: MaxSim_precision@3
value: 0.26554683411826263
name: Maxsim Precision@3
- type: MaxSim_precision@5
value: 0.2150266875981162
name: Maxsim Precision@5
- type: MaxSim_precision@10
value: 0.14901412872841444
name: Maxsim Precision@10
- type: MaxSim_recall@1
value: 0.2378753968312239
name: Maxsim Recall@1
- type: MaxSim_recall@3
value: 0.34854876486472214
name: Maxsim Recall@3
- type: MaxSim_recall@5
value: 0.41149967660335024
name: Maxsim Recall@5
- type: MaxSim_recall@10
value: 0.4744950475424349
name: Maxsim Recall@10
- type: MaxSim_ndcg@10
value: 0.44952851967210117
name: Maxsim Ndcg@10
- type: MaxSim_mrr@10
value: 0.5193719693005406
name: Maxsim Mrr@10
- type: MaxSim_map@100
value: 0.3725227084143902
name: Maxsim Map@100
ColBERT MUVERA Femto
This is a PyLate model finetuned from neuml/bert-hash-femto on the msmarco-en-bge-gemma unnormalized split dataset. It maps sentences & paragraphs to sequences of 50-dimensional dense vectors and can be used for semantic textual similarity using the MaxSim operator.
This model is trained with un-normalized scores, making it compatible with MUVERA fixed-dimensional encoding.
Usage (txtai)
This model can be used to build embeddings databases with txtai for semantic search and/or as a knowledge source for retrieval augmented generation (RAG).
Note: txtai 9.0+ is required for late interaction model support
import txtai
embeddings = txtai.Embeddings(
sparse="neuml/colbert-muvera-femto",
content=True
)
embeddings.index(documents())
# Run a query
embeddings.search("query to run")
Late interaction models excel as reranker pipelines.
from txtai.pipeline import Reranker, Similarity
similarity = Similarity(path="neuml/colbert-muvera-femto", lateencode=True)
ranker = Reranker(embeddings, similarity)
ranker("query to run")
Usage (PyLate)
Alternatively, the model can be loaded with PyLate.
from pylate import rank, models
queries = [
"query A",
"query B",
]
documents = [
["document A", "document B"],
["document 1", "document C", "document B"],
]
documents_ids = [
[1, 2],
[1, 3, 2],
]
model = models.ColBERT(
model_name_or_path="neuml/colbert-muvera-femto",
)
queries_embeddings = model.encode(
queries,
is_query=True,
)
documents_embeddings = model.encode(
documents,
is_query=False,
)
reranked_documents = rank.rerank(
documents_ids=documents_ids,
queries_embeddings=queries_embeddings,
documents_embeddings=documents_embeddings,
)
Full Model Architecture
ColBERT(
(0): Transformer({'max_seq_length': 299, 'do_lower_case': False}) with Transformer model: BertHashModel
(1): Dense({'in_features': 50, 'out_features': 50, 'bias': False, 'activation_function': 'torch.nn.modules.linear.Identity'})
)
Evaluation
BEIR Subset
The following table shows a subset of BEIR scored with the txtai benchmarks script.
Scores reported are ndcg@10 and grouped into the following three categories.
FULL multi-vector maxsim
| Model | Parameters | NFCorpus | SciDocs | SciFact | Average |
|---|---|---|---|---|---|
| ColBERT v2 | 110M | 0.3165 | 0.1497 | 0.6456 | 0.3706 |
| ColBERT MUVERA Femto | 0.2M | 0.2513 | 0.0870 | 0.4710 | 0.2698 |
| ColBERT MUVERA Pico | 0.4M | 0.3005 | 0.1117 | 0.6452 | 0.3525 |
| ColBERT MUVERA Nano | 0.9M | 0.3180 | 0.1262 | 0.6576 | 0.3673 |
| ColBERT MUVERA Micro | 4M | 0.3235 | 0.1244 | 0.6676 | 0.3718 |
MUVERA encoding + maxsim re-ranking of the top 100 results per MUVERA paper
| Model | Parameters | NFCorpus | SciDocs | SciFact | Average |
|---|---|---|---|---|---|
| ColBERT v2 | 110M | 0.3025 | 0.1538 | 0.6278 | 0.3614 |
| ColBERT MUVERA Femto | 0.2M | 0.2316 | 0.0858 | 0.4641 | 0.2605 |
| ColBERT MUVERA Pico | 0.4M | 0.2821 | 0.1004 | 0.6090 | 0.3305 |
| ColBERT MUVERA Nano | 0.9M | 0.2996 | 0.1201 | 0.6249 | 0.3482 |
| ColBERT MUVERA Micro | 4M | 0.3095 | 0.1228 | 0.6464 | 0.3596 |
MUVERA encoding only
| Model | Parameters | NFCorpus | SciDocs | SciFact | Average |
|---|---|---|---|---|---|
| ColBERT v2 | 110M | 0.2356 | 0.1229 | 0.5002 | 0.2862 |
| ColBERT MUVERA Femto | 0.2M | 0.1851 | 0.0411 | 0.3518 | 0.1927 |
| ColBERT MUVERA Pico | 0.4M | 0.1926 | 0.0564 | 0.4424 | 0.2305 |
| ColBERT MUVERA Nano | 0.9M | 0.2355 | 0.0807 | 0.4904 | 0.2689 |
| ColBERT MUVERA Micro | 4M | 0.2348 | 0.0882 | 0.4875 | 0.2702 |
Note: The scores reported don't match scores reported in the respective papers due to different default settings in the txtai benchmark scripts.
As noted earlier, models trained with min-max score normalization don't perform well with MUVERA encoding. See this GitHub Issue for more.
This model is only 250K parameters with a file size of 950K. Keeping that in mind, it's surprising how decent the scores are!
Nano BEIR
- Dataset:
NanoBEIR_mean - Evaluated with
pylate.evaluation.nano_beir_evaluator.NanoBEIREvaluator
| Metric | Value |
|---|---|
| MaxSim_accuracy@1 | 0.4318 |
| MaxSim_accuracy@3 | 0.5753 |
| MaxSim_accuracy@5 | 0.64 |
| MaxSim_accuracy@10 | 0.7062 |
| MaxSim_precision@1 | 0.4318 |
| MaxSim_precision@3 | 0.2655 |
| MaxSim_precision@5 | 0.215 |
| MaxSim_precision@10 | 0.149 |
| MaxSim_recall@1 | 0.2379 |
| MaxSim_recall@3 | 0.3485 |
| MaxSim_recall@5 | 0.4115 |
| MaxSim_recall@10 | 0.4745 |
| MaxSim_ndcg@10 | 0.4495 |
| MaxSim_mrr@10 | 0.5194 |
| MaxSim_map@100 | 0.3725 |
Training Details
Training Hyperparameters
Non-Default Hyperparameters
eval_strategy: stepsper_device_train_batch_size: 32learning_rate: 0.0003num_train_epochs: 1warmup_ratio: 0.05fp16: True
All Hyperparameters
Click to expand
overwrite_output_dir: Falsedo_predict: Falseeval_strategy: stepsprediction_loss_only: Trueper_device_train_batch_size: 32per_device_eval_batch_size: 8per_gpu_train_batch_size: Noneper_gpu_eval_batch_size: Nonegradient_accumulation_steps: 1eval_accumulation_steps: Nonetorch_empty_cache_steps: Nonelearning_rate: 0.0003weight_decay: 0.0adam_beta1: 0.9adam_beta2: 0.999adam_epsilon: 1e-08max_grad_norm: 1.0num_train_epochs: 1max_steps: -1lr_scheduler_type: linearlr_scheduler_kwargs: {}warmup_ratio: 0.05warmup_steps: 0log_level: passivelog_level_replica: warninglog_on_each_node: Truelogging_nan_inf_filter: Truesave_safetensors: Truesave_on_each_node: Falsesave_only_model: Falserestore_callback_states_from_checkpoint: Falseno_cuda: Falseuse_cpu: Falseuse_mps_device: Falseseed: 42data_seed: Nonejit_mode_eval: Falsebf16: Falsefp16: Truefp16_opt_level: O1half_precision_backend: autobf16_full_eval: Falsefp16_full_eval: Falsetf32: Nonelocal_rank: 0ddp_backend: Nonetpu_num_cores: Nonetpu_metrics_debug: Falsedebug: []dataloader_drop_last: Falsedataloader_num_workers: 0dataloader_prefetch_factor: Nonepast_index: -1disable_tqdm: Falseremove_unused_columns: Truelabel_names: Noneload_best_model_at_end: Falseignore_data_skip: Falsefsdp: []fsdp_min_num_params: 0fsdp_config: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}fsdp_transformer_layer_cls_to_wrap: Noneaccelerator_config: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}parallelism_config: Nonedeepspeed: Nonelabel_smoothing_factor: 0.0optim: adamw_torch_fusedoptim_args: Noneadafactor: Falsegroup_by_length: Falselength_column_name: lengthproject: huggingfacetrackio_space_id: trackioddp_find_unused_parameters: Noneddp_bucket_cap_mb: Noneddp_broadcast_buffers: Falsedataloader_pin_memory: Truedataloader_persistent_workers: Falseskip_memory_metrics: Trueuse_legacy_prediction_loop: Falsepush_to_hub: Falseresume_from_checkpoint: Nonehub_model_id: Nonehub_strategy: every_savehub_private_repo: Nonehub_always_push: Falsehub_revision: Nonegradient_checkpointing: Falsegradient_checkpointing_kwargs: Noneinclude_inputs_for_metrics: Falseinclude_for_metrics: []eval_do_concat_batches: Truefp16_backend: autopush_to_hub_model_id: Nonepush_to_hub_organization: Nonemp_parameters:auto_find_batch_size: Falsefull_determinism: Falsetorchdynamo: Noneray_scope: lastddp_timeout: 1800torch_compile: Falsetorch_compile_backend: Nonetorch_compile_mode: Noneinclude_tokens_per_second: Falseinclude_num_input_tokens_seen: noneftune_noise_alpha: Noneoptim_target_modules: Nonebatch_eval_metrics: Falseeval_on_start: Falseuse_liger_kernel: Falseliger_kernel_config: Noneeval_use_gather_object: Falseaverage_tokens_across_devices: Trueprompts: Nonebatch_sampler: batch_samplermulti_dataset_batch_sampler: proportional
Framework Versions
- Python: 3.10.18
- Sentence Transformers: 4.0.2
- PyLate: 1.3.2
- Transformers: 4.57.0
- PyTorch: 2.8.0+cu128
- Accelerate: 1.10.1
- Datasets: 4.1.1
- Tokenizers: 0.22.1
Citation
BibTeX
Sentence Transformers
@inproceedings{reimers-2019-sentence-bert,
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
author = "Reimers, Nils and Gurevych, Iryna",
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
month = "11",
year = "2019",
publisher = "Association for Computational Linguistics",
url = "https://arxiv.org/abs/1908.10084"
}
PyLate
@misc{PyLate,
title={PyLate: Flexible Training and Retrieval for Late Interaction Models},
author={Chaffin, Antoine and Sourty, Raphaël},
url={https://github.com/lightonai/pylate},
year={2024}
}