[Feat] refine docs and codes for more user guides (#409)

2025-05-30 16:03:24 +08:00 · 2023-09-18 16:12:13 +08:00 · 2023-09-18 16:12:13 +08:00 · 2c15a0c01d
commit 2c15a0c01d
parent a11cb45c83
3 changed files with 22 additions and 10 deletions
--- a/configs/datasets/truthfulqa/truthfulqa_gen_1e7d8d.py
+++ b/configs/datasets/truthfulqa/truthfulqa_gen_1e7d8d.py
@@ -18,8 +18,11 @@ truthfulqa_infer_cfg = dict(
 # Metrics such as 'truth' and 'info' needs
 # OPENAI_API_KEY with finetuned models in it.
 # Please use your own finetuned openai model with keys and refers to
-# the source code for more details
+# the source code of `TruthfulQAEvaluator` for more details.
-# Metrics such as 'bleurt', 'rouge', 'bleu' are free to test
+#
+# If you cannot provide available models for 'truth' and 'info',
+# and want to perform basic metric eval, please set
+# `metrics=('bleurt', 'rouge', 'bleu')`
 # When key is set to "ENV", the key will be fetched from the environment
 # variable $OPENAI_API_KEY. Otherwise, set key in here directly.
--- a/configs/datasets/truthfulqa/truthfulqa_gen_5ddc62.py
+++ b/configs/datasets/truthfulqa/truthfulqa_gen_5ddc62.py
@@ -20,8 +20,11 @@ truthfulqa_infer_cfg = dict(
 # Metrics such as 'truth' and 'info' needs
 # OPENAI_API_KEY with finetuned models in it.
 # Please use your own finetuned openai model with keys and refers to
-# the source code for more details
+# the source code of `TruthfulQAEvaluator` for more details.
-# Metrics such as 'bleurt', 'rouge', 'bleu' are free to test
+#
+# If you cannot provide available models for 'truth' and 'info',
+# and want to perform basic metric eval, please set
+# `metrics=('bleurt', 'rouge', 'bleu')`
 # When key is set to "ENV", the key will be fetched from the environment
 # variable $OPENAI_API_KEY. Otherwise, set key in here directly.
--- a/opencompass/datasets/truthfulqa.py
+++ b/opencompass/datasets/truthfulqa.py
@@ -39,7 +39,9 @@ class TruthfulQAEvaluator(BaseEvaluator):
    Args:
        truth_model (str): Truth model name. See "notes" for details.
+            Defaults to ''.
         info_model (str): Informativeness model name. See "notes" for details.
+            Defaults to ''.
        metrics (tuple): Computing needed metrics for truthfulqa dataset.
            Supported metrics are `bleurt`, `rouge`, `bleu`, `truth`, `info`.
        key (str): Corresponding API key. If set to `ENV`, find it in
@@ -67,10 +69,9 @@ class TruthfulQAEvaluator(BaseEvaluator):
        'bleu': 'bleu',
    }
-    def __init__(
+    def __init__(self,
-            self,
+                 truth_model: str = '',
-            truth_model: str,  # noqa
+                 info_model: str = '',
-            info_model: str,  # noqa
                 metrics=('bleurt', 'rouge', 'bleu', 'truth', 'info'),
                 key='ENV'):
        self.API_MODEL = {
@@ -85,6 +86,11 @@ class TruthfulQAEvaluator(BaseEvaluator):
            if metric in self.SCORE_KEY.keys():
                self.metrics.append(metric)
            if metric in self.API_MODEL.keys():
+                assert self.API_MODEL.get(metric), \
+                    f'`{metric}_model` should be set to perform API eval.' \
+                    'If you want to perform basic metric eval, ' \
+                    f'please refer to the docstring of {__file__} ' \
+                    'for more details.'
                self.api_metrics.append(metric)
        if self.api_metrics: