Skip to content

Commit 2af64c8

Browse files
authored
fix: add bert_score_dissimilarity description (#193)
1 parent 7982a0f commit 2af64c8

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

src/fmeval/reporting/constants.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,7 @@
3232
DELTA_BERT_SCORE,
3333
DELTA_METEOR_SCORE,
3434
)
35-
from fmeval.eval_algorithms.general_semantic_robustness import WER_SCORE
35+
from fmeval.eval_algorithms.general_semantic_robustness import WER_SCORE, BERT_SCORE_DISSIMILARITY
3636
from fmeval.eval_algorithms import (
3737
TREX,
3838
BOOLQ,
@@ -188,6 +188,7 @@ class ListType(Enum):
188188
BALANCED_ACCURACY_SCORE: "The balanced accuracy score is the same as accuracy in the binary case, otherwise averaged recall per class.",
189189
# General semantic robustness
190190
WER_SCORE: "Word error rate (WER) is a value between 0 and 1, and measures the difference between the model output on the unperturbed input and the output(s) on one or more perturbed versions of the same input. For more details on how word error rate is computed, see the [HuggingFace Article on Word Error Rate](https://huggingface.co/spaces/evaluate-metric/wer).",
191+
BERT_SCORE_DISSIMILARITY: "BERTScore Dissimilarity is computed as 1 - BERTScore and measures semantic differences between the original and perturbed versions of the same input.",
191192
# Summarization semantic robustness
192193
DELTA_ROUGE_SCORE: "Delta ROUGE-N score measures the change in Rouge between the original and perturbed versions of the same input.",
193194
DELTA_METEOR_SCORE: "Delta Meteor score measures the change in Meteor between the original and perturbed versions of the same input.",

0 commit comments

Comments
 (0)