OpenCompass/opencompass/openicl/icl_evaluator/icl_bpc_evaluator.py

from typing import List

import numpy as np

from opencompass.registry import ICL_EVALUATORS

from .icl_base_evaluator import BaseEvaluator


@ICL_EVALUATORS.register_module()
class BPCEvaluator(BaseEvaluator):
    """Evaluator that reports bits per character (BPC)."""

    def score(self, loss: List[float], total_chr_num: List[float]):
        """Turn summed cross-entropy losses into bits per character.

        Args:
            loss (List[float]): Cross-entropy loss values, one entry per
                batch x sliding context window. All entries are summed.
            total_chr_num (List[float]): Total number of characters in
                the original dataset. Only the first element is read.

        Returns:
            Dict[str, float]: A mapping with the single key ``'bpc'``
            holding the bits-per-character value.
        """
        summed_loss = sum(loss)

        # The losses are assumed to come from PyTorch's CrossEntropyLoss,
        # which is expressed with the natural log (nats). Scaling the
        # character count by ln(2) in the denominator converts the
        # per-character result from nats to bits.
        bits_denominator = total_chr_num[0] * np.log(2)

        result = {'bpc': summed_loss / bits_denominator}
        return result
[Feature] Adding support for LLM Compression Evaluation (#1108) * fixed formatting based on pre-commit tests * fixed typo in comments; reduced the number of models in the eval config * fixed a bug in LLMCompressionDataset, where setting samples=None would result in passing test[:None] to load_dataset * removed unnecessary variable in _format_table_pivot; changed lark_reporter message to English 2024-04-30 10:51:01 +08:00			`from typing import List`

			`import numpy as np`

			`from opencompass.registry import ICL_EVALUATORS`

			`from .icl_base_evaluator import BaseEvaluator`


			`@ICL_EVALUATORS.register_module()`
			`class BPCEvaluator(BaseEvaluator):`

			`def score(self, loss: List[float], total_chr_num: List[float]):`
			`"""Calculate bits per character based on inference results.`

			`Args:`
			`loss (List[float]): CrossEntropyLoss per batch x sliding`
			`context window`
			`total_chr_num (List[float]): Total number of characters`
			`in the original dataset.`

			`Returns:`
			`Dict[str, float]: Bits per Character`
			`"""`
			`total_loss = sum(loss)`

			`# Multiplying by log(2) to correct for the constant shift`
			`# due to natural log used in the PyTorch implementation`
			`# of CrossEntropyLoss`
			`bpc = total_loss / (total_chr_num[0] * np.log(2))`

			`return {'bpc': bpc}`