Skip to content

Commit

Permalink
Merge branch 'refs/heads/main' into v2.0.0
Browse files Browse the repository at this point in the history
# Conflicts:
#	mteb/models/e5_models.py
#	mteb/models/gme_models.py
#	mteb/models/gritlm_models.py
#	mteb/models/jina_models.py
#	mteb/models/lens_models.py
#	mteb/models/llm2vec_models.py
#	mteb/models/overview.py
#	mteb/models/salesforce_models.py
#	mteb/models/sentence_transformers_models.py
  • Loading branch information
Samoed committed Jan 24, 2025
2 parents f1d418c + fa5127a commit c26adee
Showing 1 changed file with 55 additions and 0 deletions.
55 changes: 55 additions & 0 deletions mteb/models/ru_sentence_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -160,6 +160,61 @@
public_training_data=None,
)

# Model metadata for deepvk/USER-bge-m3 (Russian-only entry, adapted from
# BAAI/bge-m3). The loader and the metadata are pinned to the same revision.
# NOTE(review): `user_bge_m3` is assigned again right after this block, which
# would overwrite this binding -- looks like a merge duplicate; confirm and
# keep only one definition.
user_bge_m3 = ModelMeta(
    loader=partial(  # type: ignore
        sentence_transformers_loader,
        model_name="deepvk/USER-bge-m3",
        revision="0cc6cfe48e260fb0474c753087a69369e88709ae",
    ),
    name="deepvk/USER-bge-m3",
    languages=["rus_Cyrl"],
    open_weights=True,
    revision="0cc6cfe48e260fb0474c753087a69369e88709ae",
    release_date="2024-07-05",
    n_parameters=359_026_688,
    embed_dim=1024,
    license="apache-2.0",
    max_tokens=8194,
    # Points at this model's own page (was the USER-base page, which
    # did not match `name` / `model_name` above).
    reference="https://huggingface.co/deepvk/USER-bge-m3",
    similarity_fn_name="cosine",
    framework=["Sentence Transformers", "PyTorch"],
    adapted_from="https://huggingface.co/BAAI/bge-m3",
    use_instructions=False,
    # Only the quoted keys are actual entries; the commented-out names are
    # kept as a record of further training sources and are not part of the
    # dict.
    training_datasets={
        "BibleNLPBitextMining": ["train"],
        # https://github.com/unicamp-dl/mMARCO
        # deepvk/ru-HNP
        # deepvk/ru-WANLI
        # MedNLI
        # RCB
        "TERRa": ["train"],
        # Tapaco
        # Opus100
        # BiblePar
        # RudetoxifierDataDetox
        # RuParadetox
        "MIRACL": ["train"],
        # MLDR
        # Lenta
        "MLSUMClusteringP2P": ["train"],
        "MLSUMClusteringP2P.v2": ["train"],
        "MLSUMClusteringS2S": ["train"],
        "MLSUMClusteringS2S.v2": ["train"],
        "MrTidyRetrieval": ["train"],
        # Panorama
        # PravoIsrael
        # xlsum
        # Fialka-v1
        # RussianKeywords
        # Gazeta
        # Gsm8k-ru
        # DSumRu
        # SummDialogNews
    },
    public_training_code=None,
    public_training_data=None,
)

user_bge_m3 = ModelMeta(
loader=partial( # type: ignore
sentence_transformers_loader,
Expand Down

0 comments on commit c26adee

Please sign in to comment.