Skip to content

Commit 73168c6

Browse files
authored
fix: Updated metadata on model memory (#3624)
fix model memory
1 parent 7e2fa98 commit 73168c6

File tree

8 files changed

+15
-15
lines changed

8 files changed

+15
-15
lines changed

mteb/models/model_implementations/google_models.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -275,5 +275,5 @@ def gemma_embedding_loader(model_name: str, revision: str, **kwargs):
275 275   public_training_data=None,
276 276   training_datasets=GECKO_TRAINING_DATA,
277 277   similarity_fn_name="cosine",
278     - memory_usage_mb=578,
    278 + memory_usage_mb=1155,
279 279   )

mteb/models/model_implementations/nb_sbert.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,7 @@
 11  11   revision="b95656350a076aeafd2d23763660f80655408cc6",
 12  12   release_date="2022-11-23",
 13  13   n_parameters=1_780_000_000,
 14     - memory_usage_mb=197,
     14 + memory_usage_mb=678,
 15  15   embed_dim=4096,
 16  16   license="apache-2.0",
 17  17   max_tokens=75,

mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -146,7 +146,7 @@ def encode(
146 146   release_date="2025-06-27",
147 147   modalities=["image", "text"],
148 148   n_parameters=2_418_000_000,
149     - memory_usage_mb=9224,
    149 + memory_usage_mb=4610,
150 150   max_tokens=8192,
151 151   embed_dim=2048,
152 152   license="https://huggingface.co/nvidia/llama-nemoretriever-colembed-1b-v1/blob/main/LICENSE",
@@ -172,7 +172,7 @@ def encode(
172 172   release_date="2025-06-27",
173 173   modalities=["image", "text"],
174 174   n_parameters=4_407_000_000,
175     - memory_usage_mb=16811,
    175 + memory_usage_mb=8403,
176 176   max_tokens=8192,
177 177   embed_dim=3072,
178 178   license="https://huggingface.co/nvidia/llama-nemoretriever-colembed-1b-v1/blob/main/LICENSE",

mteb/models/model_implementations/nvidia_models.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -146,7 +146,7 @@ def instruction_template(
146 146   revision="570834afd5fef5bf3a3c2311a2b6e0a66f6f4f2c",
147 147   release_date="2024-09-13", # initial commit of hf model.
148 148   n_parameters=7_850_000_000,
149     - memory_usage_mb=29945,
    149 + memory_usage_mb=14975,
150 150   embed_dim=4096,
151 151   license="cc-by-nc-4.0",
152 152   max_tokens=32768,

mteb/models/model_implementations/ops_moa_models.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@ def encode(self, sentences: list[str], **kwargs) -> np.ndarray:
 27  27   languages=["zho-Hans"],
 28  28   loader=OPSWrapper,
 29  29   n_parameters=int(343 * 1e6),
 30     - memory_usage_mb=2e3,
     30 + memory_usage_mb=1308,
 31  31   max_tokens=512,
 32  32   embed_dim=1536,
 33  33   license="cc-by-nc-4.0",
@@ -58,7 +58,7 @@ def encode(self, sentences: list[str], **kwargs) -> np.ndarray:
 58  58   languages=["zho-Hans"],
 59  59   loader=OPSWrapper,
 60  60   n_parameters=int(343 * 1e6),
 61     - memory_usage_mb=2e3,
     61 + memory_usage_mb=1242,
 62  62   max_tokens=512,
 63  63   embed_dim=1536,
 64  64   license="cc-by-nc-4.0",

mteb/models/model_implementations/promptriever_models.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol:
 80  80   revision="01c7f73d771dfac7d292323805ebc428287df4f9-30b14e3813c0fa45facfd01a594580c3fe5ecf23", # base-peft revision
 81  81   release_date="2024-09-15",
 82  82   n_parameters=7_000_000_000,
 83     - memory_usage_mb=27,
     83 + memory_usage_mb=26703,
 84  84   max_tokens=4096,
 85  85   embed_dim=4096,
 86  86   license="apache-2.0",
@@ -115,7 +115,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol:
115 115   },
116 116   release_date="2024-09-15",
117 117   n_parameters=8_000_000_000,
118     - memory_usage_mb=31,
    118 + memory_usage_mb=30518,
119 119   max_tokens=8192,
120 120   embed_dim=4096,
121 121   license="apache-2.0",
@@ -143,7 +143,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol:
143 143   revision="5206a32e0bd3067aef1ce90f5528ade7d866253f-8b677258615625122c2eb7329292b8c402612c21", # base-peft revision
144 144   release_date="2024-09-15",
145 145   n_parameters=8_000_000_000,
146     - memory_usage_mb=31,
    146 + memory_usage_mb=30518,
147 147   max_tokens=8192,
148 148   embed_dim=4096,
149 149   training_datasets={
@@ -175,7 +175,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol:
175 175   revision="7231864981174d9bee8c7687c24c8344414eae6b-876d63e49b6115ecb6839893a56298fadee7e8f5", # base-peft revision
176 176   release_date="2024-09-15",
177 177   n_parameters=7_000_000_000,
178     - memory_usage_mb=27,
    178 + memory_usage_mb=26703,
179 179   training_datasets={
180 180   # "samaya-ai/msmarco-w-instructions",
181 181   "mMARCO-NL", # translation not trained on

mteb/models/model_implementations/qwen3_models.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -139,7 +139,7 @@ def q3e_instruct_loader(
139 139   revision="b22da495047858cce924d27d76261e96be6febc0", # Commit of @tomaarsen
140 140   release_date="2025-06-05",
141 141   n_parameters=595776512,
142     - memory_usage_mb=2272,
    142 + memory_usage_mb=1136,
143 143   embed_dim=1024,
144 144   max_tokens=32768,
145 145   license="apache-2.0",
@@ -161,7 +161,7 @@ def q3e_instruct_loader(
161 161   revision="636cd9bf47d976946cdbb2b0c3ca0cb2f8eea5ff", # Commit of @tomaarsen
162 162   release_date="2025-06-05",
163 163   n_parameters=4021774336,
164     - memory_usage_mb=15341,
    164 + memory_usage_mb=7671,
165 165   embed_dim=2560,
166 166   max_tokens=32768,
167 167   license="apache-2.0",
@@ -183,7 +183,7 @@ def q3e_instruct_loader(
183 183   revision="4e423935c619ae4df87b646a3ce949610c66241c", # Commit of @tomaarsen
184 184   release_date="2025-06-05",
185 185   n_parameters=7567295488,
186     - memory_usage_mb=28866,
    186 + memory_usage_mb=14433,
187 187   embed_dim=4096,
188 188   max_tokens=32768,
189 189   license="apache-2.0",

mteb/models/model_implementations/qzhou_models.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -63,7 +63,7 @@ def instruction_template(
 63  63   revision="f1e6c03ee3882e7b9fa5cec91217715272e433b8",
 64  64   release_date="2025-08-24",
 65  65   n_parameters=7_070_619_136,
 66     - memory_usage_mb=29070,
     66 + memory_usage_mb=14436,
 67  67   embed_dim=3584,
 68  68   license="apache-2.0",
 69  69   max_tokens=8192,

0 commit comments

Comments
 (0)