From 5dcb58d54e54aa2319b310fe30504eb6bd0eb767 Mon Sep 17 00:00:00 2001
From: sergeyz-zh <49659999+sergeyz-zh@users.noreply.github.com>
Date: Tue, 11 Mar 2025 17:46:12 +0300
Subject: [PATCH 1/2] Add rubert-mini-frida model meta

---
Reviewer notes (placed after the three-dash line, so they are not part of
the commit message):
  Adds the module-level ModelMeta entry `rubert_mini_frida` for
  sergeyzh/rubert-mini-frida, inserted just before `labse_ru_turbo`.
  `training_datasets` is an empty dict; the four dataset URLs exist only as
  comments inside it.
  NOTE(review): `use_instructions=True` is set, but this hunk passes no
  loader or prompt mapping -- confirm prompts are configured elsewhere.

 mteb/models/ru_sentence_models.py | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/mteb/models/ru_sentence_models.py b/mteb/models/ru_sentence_models.py
index 905fb6550a..5775f62d2c 100644
--- a/mteb/models/ru_sentence_models.py
+++ b/mteb/models/ru_sentence_models.py
@@ -357,6 +357,32 @@
     adapted_from="cointegrated/rubert-tiny2",
 )
 
+rubert_mini_frida = ModelMeta(
+    name="sergeyzh/rubert-mini-frida",
+    languages=["rus_Cyrl"],
+    open_weights=True,
+    revision="19b279b78afd945b5ccae78f63e284909814adc2",
+    release_date="2025-03-02",
+    n_parameters=32_300_000,
+    memory_usage_mb=123,
+    embed_dim=312,
+    license="mit",
+    max_tokens=2048,
+    reference="https://huggingface.co/sergeyzh/rubert-mini-frida",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=True,
+    public_training_code=None,
+    public_training_data=None,
+    training_datasets={
+        # https://huggingface.co/datasets/IlyaGusev/gazeta
+        # https://huggingface.co/datasets/zloelias/lenta-ru
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb-2
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb
+    },
+    adapted_from="sergeyzh/rubert-mini-sts",
+)
+
 labse_ru_turbo = ModelMeta(
     name="sergeyzh/LaBSE-ru-turbo",
     languages=["rus_Cyrl"],

From 3fa111722e28c7ec8a5548aab51ec046cdebc7dc Mon Sep 17 00:00:00 2001
From: sergeyz-zh <49659999+sergeyz-zh@users.noreply.github.com>
Date: Tue, 11 Mar 2025 17:47:35 +0300
Subject: [PATCH 2/2] Add BERTA model meta

---
Reviewer notes (placed after the three-dash line, so they are not part of
the commit message):
  Adds the module-level ModelMeta entry `berta` for sergeyzh/BERTA, inserted
  just before `rosberta_prompts`.
  `training_datasets` is an empty dict; the four dataset URLs exist only as
  comments inside it.
  NOTE(review): `use_instructions=True` is set, but this hunk passes no
  loader or prompt mapping -- confirm prompts are configured elsewhere.

 mteb/models/ru_sentence_models.py | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/mteb/models/ru_sentence_models.py b/mteb/models/ru_sentence_models.py
index 5775f62d2c..c3c63d5461 100644
--- a/mteb/models/ru_sentence_models.py
+++ b/mteb/models/ru_sentence_models.py
@@ -404,6 +404,32 @@
     public_training_data=None,
 )
 
+berta = ModelMeta(
+    name="sergeyzh/BERTA",
+    languages=["rus_Cyrl"],
+    open_weights=True,
+    revision="914c8c8aed14042ed890fc2c662d5e9e66b2faa7",
+    release_date="2025-03-10",
+    n_parameters=128_000_000,
+    memory_usage_mb=489,
+    embed_dim=768,
+    license="mit",
+    max_tokens=512,
+    reference="https://huggingface.co/sergeyzh/BERTA",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=True,
+    training_datasets={
+        # https://huggingface.co/datasets/IlyaGusev/gazeta
+        # https://huggingface.co/datasets/zloelias/lenta-ru
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb-2
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb
+    },
+    public_training_code=None,
+    adapted_from="sergeyzh/LaBSE-ru-turbo",
+    public_training_data=None,
+)
+
 rosberta_prompts = {
     # Default
     "Classification": "classification: ",