Skip to content

Commit 94010c7

Browse files
committed
Add docstring for encode_kwargs
1 parent 82d37a3 commit 94010c7

File tree

7 files changed

+16
-0
lines changed

7 files changed

+16
-0
lines changed

src/jmteb/embedders/base.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@ def encode(self, text: str | list[str], prefix: str | None = None, **kwargs) ->
2525
Args:
2626
text (str | list[str]): text string, or a list of texts.
2727
prefix (str, optional): the prefix to use for encoding. Defaults to None.
28+
**kwargs: additional settings that may be necessary for specific models.
2829
"""
2930
raise NotImplementedError
3031

src/jmteb/evaluators/classification/evaluator.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@ class ClassificationEvaluator(EmbeddingEvaluator):
2929
classifiers (dict[str, Classifier]): classifiers to be evaluated.
3030
prefix (str | None): prefix for sentences. Defaults to None.
3131
log_predictions (bool): whether to log predictions of each datapoint.
32+
encode_kwargs (dict): kwargs passed to embedder's encode function. Defaults to {}.
3233
"""
3334

3435
def __init__(

src/jmteb/evaluators/clustering/evaluator.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,14 @@
2424
class ClusteringEvaluator(EmbeddingEvaluator):
2525
"""
2626
ClusteringEvaluator is a class for evaluating clustering models.
27+
28+
Args:
29+
val_dataset (ClusteringDataset): validation dataset
30+
test_dataset (ClusteringDataset): evaluation dataset
31+
prefix (str | None): prefix for sentences. Defaults to None.
32+
random_seed (int | None): random seed used in clustering models. Defaults to None.
33+
log_predictions (bool): whether to log predictions of each datapoint.
34+
encode_kwargs (dict): kwargs passed to embedder's encode function. Defaults to {}.
2735
"""
2836

2937
def __init__(

src/jmteb/evaluators/pair_classification/evaluator.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,7 @@ class PairClassificationEvaluator(EmbeddingEvaluator):
2222
test_dataset (PairClassificationDataset): test dataset
2323
sentence1_prefix (str | None): prefix for sentence1. Defaults to None.
2424
sentence2_prefix (str | None): prefix for sentence2. Defaults to None.
25+
encode_kwargs (dict): kwargs passed to embedder's encode function. Defaults to {}.
2526
2627
# NOTE: Don't log predictions, as predictions by different metrics could be different.
2728
"""

src/jmteb/evaluators/reranking/evaluator.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,8 @@ class RerankingEvaluator(EmbeddingEvaluator):
3939
doc_prefix (str | None): prefix for documents. Defaults to None.
4040
log_predictions (bool): whether to log predictions of each datapoint. Defaults to False.
4141
top_n_docs_to_log (int): log only top n documents. Defaults to 5.
42+
query_encode_kwargs (dict): kwargs passed to embedder's encode function when encoding queries. Defaults to {}.
43+
doc_encode_kwargs (dict): kwargs passed to embedder's encode function when encoding documents. Defaults to {}.
4244
"""
4345

4446
def __init__(

src/jmteb/evaluators/retrieval/evaluator.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -42,6 +42,8 @@ class RetrievalEvaluator(EmbeddingEvaluator):
4242
doc_prefix (str | None): prefix for documents. Defaults to None.
4343
log_predictions (bool): whether to log predictions of each datapoint. Defaults to False.
4444
top_n_docs_to_log (int): log only top n documents that are predicted as relevant. Defaults to 5.
45+
query_encode_kwargs (dict): kwargs passed to embedder's encode function when encoding queries. Defaults to {}.
46+
doc_encode_kwargs (dict): kwargs passed to embedder's encode function when encoding documents. Defaults to {}.
4547
"""
4648

4749
def __init__(

src/jmteb/evaluators/sts/evaluator.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@ class STSEvaluator(EmbeddingEvaluator):
2626
test_dataset (STSDataset): test dataset
2727
sentence1_prefix (str | None): prefix for sentence1. Defaults to None.
2828
sentence2_prefix (str | None): prefix for sentence2. Defaults to None.
29+
encode_kwargs (dict): kwargs passed to embedder's encode function. Defaults to {}.
2930
"""
3031

3132
def __init__(

0 commit comments

Comments
 (0)