From 46cd631e137075e0d0704d2f4a02c42a21100acf Mon Sep 17 00:00:00 2001 From: jnanliu Date: Wed, 26 Feb 2025 03:53:10 +0000 Subject: [PATCH] recover pre-commit and edit math expr in doc --- .pre-commit-config-zh-cn.yaml | 7 +------ .pre-commit-config.yaml | 7 +------ docs/en/user_guides/datasets.md | 11 +++++++---- docs/zh_cn/user_guides/datasets.md | 10 ++++++---- 4 files changed, 15 insertions(+), 20 deletions(-) diff --git a/.pre-commit-config-zh-cn.yaml b/.pre-commit-config-zh-cn.yaml index d8d58935..2e21c85d 100644 --- a/.pre-commit-config-zh-cn.yaml +++ b/.pre-commit-config-zh-cn.yaml @@ -88,12 +88,7 @@ repos: - mdformat-openmmlab - mdformat_frontmatter - linkify-it-py - exclude: | - (?x)^( - configs/ | - docs/zh_cn/user_guides/datasets.md | - docs/en/user_guides/datasets.md - ) + exclude: configs/ - repo: https://gitee.com/openmmlab/mirrors-docformatter rev: v1.3.1 hooks: diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index f5a70d4e..9f72ae42 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -88,12 +88,7 @@ repos: - mdformat-openmmlab - mdformat_frontmatter - linkify-it-py - exclude: | - (?x)^( - configs/ | - docs/zh_cn/user_guides/datasets.md | - docs/en/user_guides/datasets.md - ) + exclude: configs/ - repo: https://github.com/myint/docformatter rev: v1.3.1 hooks: diff --git a/docs/en/user_guides/datasets.md b/docs/en/user_guides/datasets.md index 22589cbf..83460672 100644 --- a/docs/en/user_guides/datasets.md +++ b/docs/en/user_guides/datasets.md @@ -82,7 +82,6 @@ Users can choose different abilities, different datasets and different evaluatio For information on how to start an evaluation task and how to evaluate self-built datasets, please refer to the relevant documents. - ### Multiple Evaluations on the Dataset In the dataset configuration, you can set the parameter `n` to perform multiple evaluations on the same dataset and return the average metrics, for example: @@ -99,11 +98,15 @@ afqmc_datasets = [ eval_cfg=afqmc_eval_cfg, ), ] + ``` -> [!TIP] + +> \[!TIP\] > Additionally, for binary evaluation metrics (such as accuracy, pass-rate, etc.), you can also set the parameter `k` in conjunction with `n` for [G-Pass@k](http://arxiv.org/abs/2412.13147) evaluation. The formula for G-Pass@k is: > -> $$ \text{G-Pass@}k_\tau=E_{\text{Data}}\left[ \sum_{j=\lceil \tau \cdot k \rceil}^c \frac{{c \choose j} \cdot {n - c \choose k - j}}{{n \choose k}} \right], $$ +> ```{math} +> \text{G-Pass@}k_\tau=E_{\text{Data}}\left[ \sum_{j=\lceil \tau \cdot k \rceil}^c \frac{{c \choose j} \cdot {n - c \choose k - j}}{{n \choose k}} \right], +> ``` > > where $n$ is the number of evaluations, and $c$ is the number of times that passed or were correct out of $n$ runs. An example configuration is as follows: @@ -118,4 +121,4 @@ aime2024_datasets = [ ... ) ] -``` \ No newline at end of file +``` diff --git a/docs/zh_cn/user_guides/datasets.md b/docs/zh_cn/user_guides/datasets.md index dcd4c301..d22d57f6 100644 --- a/docs/zh_cn/user_guides/datasets.md +++ b/docs/zh_cn/user_guides/datasets.md @@ -100,10 +100,12 @@ afqmc_datasets = [ ] ``` -> [!TIP] -> 另外,对于二值评测指标(例如accuracy,pass-rate等),还可以通过设置参数`k`配合`n`进行[G-Pass@k](http://arxiv.org/abs/2412.13147)评测。G-Pass@k计算公式为: -> -> $$ \text{G-Pass@}k_\tau=E_{\text{Data}}\left[ \sum_{j=\lceil \tau \cdot k \rceil}^c \frac{{c \choose j} \cdot {n - c \choose k - j}}{{n \choose k}} \right], $$ +> \[!TIP\] +> 另外,对于二值评测指标(例如accuracy,pass-rate等),还可以通过设置参数`k`配合`n`进行[G-Pass@k](http://arxiv.org/abs/2412.13147)评测。G-Pass@k计算公式为: +> +> ```{math} +> \text{G-Pass@}k_\tau=E_{\text{Data}}\left[ \sum_{j=\lceil \tau \cdot k \rceil}^c \frac{{c \choose j} \cdot {n - c \choose k - j}}{{n \choose k}} \right], +> ``` > > 其中 $n$ 为评测次数, $c$ 为 $n$ 次运行中通过或正确的次数。配置例子如下: