From b3cbef322676ade0d6c2d78d4fcb2ad033fc22a5 Mon Sep 17 00:00:00 2001
From: jingmingzhuo <109033042+jingmingzhuo@users.noreply.github.com>
Date: Thu, 9 Nov 2023 22:05:25 +0800
Subject: [PATCH] [Feature] Add py150 and maxmin (#562)

* [feat] add clozeTesst_maxmin dataset

* [feat] add py150 datasets

* [feat] change __init__.py in opencompass/datasets

* [fix] pre-commit check

* [fix] rename py150 and masxmin datasets in configs

* [feat] add gen.py of py150 and maxmin in configs/datasets
---
 .../clozeTest_maxmin/clozeTest_maxmin_gen.py  |  4 ++
 .../clozeTest_maxmin_gen_c205fb.py            | 42 +++++++++++++++++++
 configs/datasets/py150/py150_gen.py           |  4 ++
 configs/datasets/py150/py150_gen_38b13d.py    | 41 ++++++++++++++++++
 opencompass/datasets/__init__.py              |  2 +
 opencompass/datasets/clozeTest_maxmin.py      | 35 ++++++++++++++++
 opencompass/datasets/py150.py                 | 38 +++++++++++++++++
 7 files changed, 166 insertions(+)
 create mode 100644 configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen.py
 create mode 100644 configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen_c205fb.py
 create mode 100644 configs/datasets/py150/py150_gen.py
 create mode 100644 configs/datasets/py150/py150_gen_38b13d.py
 create mode 100644 opencompass/datasets/clozeTest_maxmin.py
 create mode 100644 opencompass/datasets/py150.py
diff --git a/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen.py b/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen.py
new file mode 100644
index 000000000..eab463da5
--- /dev/null
+++ b/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen.py
@@ -0,0 +1,4 @@
+from mmengine.config import read_base
+
+with read_base():
+    from .clozeTest_maxmin_gen_c205fb import maxmin_datasets  # noqa: F401, F403
\ No newline at end of file
diff --git a/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen_c205fb.py b/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen_c205fb.py
new file mode 100644
index 000000000..d77e85942
--- /dev/null
+++ b/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen_c205fb.py
@@ -0,0 +1,42 @@
+from opencompass.openicl.icl_prompt_template import PromptTemplate
+from opencompass.openicl.icl_retriever import ZeroRetriever
+from opencompass.openicl.icl_inferencer import GenInferencer
+from opencompass.openicl.icl_evaluator import AccEvaluator
+from opencompass.datasets import MaxminDataset
+from opencompass.utils.text_postprocessors import first_capital_postprocess
+
+
+maxmin_reader_cfg = dict(
+    input_columns=["nl_tokens", "pl_tokens"],
+    output_column="answer",
+)
+
+maxmin_infer_cfg = dict(
+    prompt_template=dict(
+        type=PromptTemplate,
+        template=dict(
+            round=[
+                dict(role="HUMAN", prompt="Code:{pl_tokens}\nThe aim of the code: {nl_tokens}\nQuestion: Please tell me what \"<mask>\" in the code should be replaced with and you must response to me only A or B.\nA. max\nB. min\nAnswer:"),
+                dict(role="BOT", prompt="{answer}"),
+            ]
+        ),
+    ),
+    retriever=dict(type=ZeroRetriever),
+    inferencer=dict(type=GenInferencer),
+)
+
+maxmin_eval_cfg = dict(evaluator=dict(type=AccEvaluator),
+                        pred_role="BOT",
+                        pred_postprocessor=dict(type=first_capital_postprocess))
+
+maxmin_datasets = [
+    dict(
+        type=MaxminDataset,
+        abbr=f"maxmin",
+        test_path=f"data/clozeTest-maxmin/python/clozeTest.json",
+        answer_path=f"data/clozeTest-maxmin/python/answers.txt",
+        reader_cfg=maxmin_reader_cfg,
+        infer_cfg=maxmin_infer_cfg,
+        eval_cfg=maxmin_eval_cfg,
+    )
+]
\ No newline at end of file
diff --git a/configs/datasets/py150/py150_gen.py b/configs/datasets/py150/py150_gen.py
new file mode 100644
index 000000000..68bb3b11d
--- /dev/null
+++ b/configs/datasets/py150/py150_gen.py
@@ -0,0 +1,4 @@
+from mmengine.config import read_base
+
+with read_base():
+    from .py150_gen_38b13d import py150_datasets  # noqa: F401, F403
\ No newline at end of file
diff --git a/configs/datasets/py150/py150_gen_38b13d.py b/configs/datasets/py150/py150_gen_38b13d.py
new file mode 100644
index 000000000..ca62043ab
--- /dev/null
+++ b/configs/datasets/py150/py150_gen_38b13d.py
@@ -0,0 +1,41 @@
+from opencompass.openicl.icl_prompt_template import PromptTemplate
+from opencompass.openicl.icl_retriever import ZeroRetriever
+from opencompass.openicl.icl_inferencer import GenInferencer
+from opencompass.openicl.icl_evaluator import BleuEvaluator
+from opencompass.datasets import Py150Dataset
+from opencompass.utils.text_postprocessors import first_capital_postprocess
+
+
+py150_reader_cfg = dict(
+    input_columns="input",
+    output_column="gt",
+)
+
+py150_infer_cfg = dict(
+    prompt_template=dict(
+        type=PromptTemplate,
+        template=dict(
+            round=[
+                dict(role="HUMAN", prompt="I will give you a part of python code. Please write down what the next line of code is. Note that you only need to give the next line of code, and you don't need to give any other reply.\nCode:{input}\nNext line:"),
+                dict(role="BOT", prompt="{gt}"),
+            ]
+        ),
+    ),
+    retriever=dict(type=ZeroRetriever),
+    inferencer=dict(type=GenInferencer),
+)
+
+py150_eval_cfg = dict(evaluator=dict(type=BleuEvaluator),
+                        pred_role="BOT"
+                    )
+
+py150_datasets = [
+    dict(
+        type=Py150Dataset,
+        abbr=f"py150",
+        path=f"data/py150/test.json",
+        reader_cfg=py150_reader_cfg,
+        infer_cfg=py150_infer_cfg,
+        eval_cfg=py150_eval_cfg,
+    )
+]
\ No newline at end of file
diff --git a/opencompass/datasets/__init__.py b/opencompass/datasets/__init__.py
index 7049cb678..a419e3658 100644
--- a/opencompass/datasets/__init__.py
+++ b/opencompass/datasets/__init__.py
@@ -14,6 +14,7 @@
 from .chid import *  # noqa: F401, F403
 from .cibench import *  # noqa: F401, F403
 from .civilcomments import *  # noqa: F401, F403
+from .clozeTest_maxmin import *  # noqa: F401, F403
 from .cluewsc import *  # noqa: F401, F403
 from .cmb import *  # noqa: F401, F403
 from .cmmlu import *  # noqa: F401, F403
@@ -55,6 +56,7 @@
 from .natural_question import *  # noqa: F401, F403
 from .obqa import *  # noqa: F401, F403
 from .piqa import *  # noqa: F401, F403
+from .py150 import *  # noqa: F401, F403
 from .qasper import *  # noqa: F401, F403
 from .qaspercut import *  # noqa: F401, F403
 from .race import *  # noqa: F401, F403
diff --git a/opencompass/datasets/clozeTest_maxmin.py b/opencompass/datasets/clozeTest_maxmin.py
new file mode 100644
index 000000000..93288bf21
--- /dev/null
+++ b/opencompass/datasets/clozeTest_maxmin.py
@@ -0,0 +1,35 @@
+import json
+
+from datasets import Dataset
+
+from opencompass.registry import LOAD_DATASET
+
+from .base import BaseDataset
+
+
+@LOAD_DATASET.register_module()
+class MaxminDataset(BaseDataset):
+
+    @staticmethod
+    def load(test_path, answer_path=None):
+        if answer_path is not None:
+            with open(answer_path, 'r', encoding='utf-8') as answer_f:
+                answers = {}
+                for line in answer_f.readlines():
+                    line = line.strip()
+                    answers[line.split('<CODESPLIT>')[0]] = line.split(
+                        '<CODESPLIT>')[1]
+        datasets = []
+        with open(test_path, 'r') as test_f:
+            test_data = json.load(test_f)
+            for item in test_data:
+                dataset = dict()
+                dataset['nl_tokens'] = ' '.join(item['nl_tokens'])
+                dataset['pl_tokens'] = ' '.join(item['pl_tokens'])
+                if answer_path is not None:
+                    dataset['answer'] = 'A' if answers[
+                        item['idx']] == 'max' else 'B'
+                else:
+                    dataset['answer'] = ''
+                datasets.append(dataset)
+        return Dataset.from_list(datasets)
diff --git a/opencompass/datasets/py150.py b/opencompass/datasets/py150.py
new file mode 100644
index 000000000..d478357d8
--- /dev/null
+++ b/opencompass/datasets/py150.py
@@ -0,0 +1,38 @@
+import json
+import re
+
+from datasets import Dataset
+
+from opencompass.registry import LOAD_DATASET
+
+from .base import BaseDataset
+
+
+def py150_post_process(code):
+    code = code.replace('<NUM_LIT>',
+                        '0').replace('<STR_LIT>',
+                                     '').replace('<CHAR_LIT>', '')
+    pattern = re.compile(r'<(STR|NUM|CHAR)_LIT:(.*?)>', re.S)
+    lit_s = re.findall(pattern, code)
+    for lit in lit_s:
+        code = code.replace(f'<{lit[0]}_LIT:{lit[1]}>', lit[1])
+    code = json.loads(code)
+    code['input'] = code['input'].replace('<s>', '').split('<EOL>')
+    for code_line in code['input']:
+        code_line = code_line.strip()
+    code['input'] = '\n'.join(code['input'])
+    code.pop('id', None)
+    return code
+
+
+@LOAD_DATASET.register_module()
+class Py150Dataset(BaseDataset):
+
+    @staticmethod
+    def load(path):
+        lines = open(path, 'r').readlines()
+        rows = []
+        for line in lines:
+            row = py150_post_process(line)
+            rows.append(row)
+        return Dataset.from_list(rows)