Skip to content

Commit

Permalink
update embd batch size
Browse files: browse the repository at this point in the history
  • Loading branch information
henry-yeh committed Sep 9, 2024
1 parent a4a6fe4 commit 887107a
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion gpv/embd.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ def __init__(self, model_name_or_path: str='Alibaba-NLP/gte-multilingual-base',
self.tokenizer = AutoTokenizer.from_pretrained(model_name_or_path)


- def get_embedding(self, input_texts: list[str], dimension: int = 768, batch_size: int = 16) -> torch.Tensor:
+ def get_embedding(self, input_texts: list[str], dimension: int = 768, batch_size: int = 8) -> torch.Tensor:
"""
Get the sentence embeddings of the input texts.
Expand Down

0 comments on commit 887107a

Please sign in to comment.