Skip to content

Commit 3216dc0

Browse files
adding tests for class_eval
1 parent: 1812344 · commit: 3216dc0

File tree

3 files changed

+29
-26
lines changed

3 files changed

+29
-26
lines changed

src/inspect_evals/class_eval/class_eval.py

Lines changed: 1 addition & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -31,10 +31,6 @@
3131
)
3232
from inspect_ai.util import ExecResult, sandbox
3333

34-
35-
import importlib
36-
import unittest
37-
3834
from utils import InferenceUtil, ModelName, GenerationStrategy, construct_prompt
3935

4036

@@ -89,12 +85,8 @@ def class_eval_scorer() -> Scorer:
8985
async def score(state:TaskState, target: Target) -> Score:
9086

9187
result = {}
92-
test_code = state.metadata["class_name"] + str(state.metadata["task_id"])
93-
88+
9489
generated_code = find_code(state.output.completion)
95-
96-
#test_classes = state.metadata["test_classes"]
97-
9890
code = generated_code + "\n" + state.metadata["test"]
9991

10092
explanation = ""
@@ -161,10 +153,3 @@ def record_to_sample(
161153
"fields": record["fields"],
162154
}
163155
)
164-
165-
166-
def sample_to_fewshot(sample: Sample) -> str:
167-
metadata = sample.metadata
168-
return (
169-
f"{metadata['class_description']}\n"
170-
)

src/inspect_evals/class_eval/test.py

Lines changed: 20 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -1,9 +1,20 @@
11
import unittest
2+
from inspect_ai.solver import (
3+
generate,
4+
system_message
5+
)
26

37
from utils import construct_prompt
4-
from class_eval import record_to_sample, find_code
8+
from class_eval import record_to_sample, find_code, class_eval
59

6-
from test_data import record, sample, prompt, sample_code, raw_code
10+
from test_data import (
11+
record,
12+
sample,
13+
prompt,
14+
sample_code,
15+
raw_code,
16+
INSTRUCTION
17+
)
718

819
class TestClassEval(unittest.TestCase):
920

@@ -13,14 +24,14 @@ def test_record_to_sample(self):
1324
def test_find_code(self):
1425
self.assertEqual(find_code(raw_code), sample_code)
1526

27+
def test_task(self):
28+
task = class_eval(k_shot = 5)
29+
self.assertEqual(task.dataset.name, 'FudanSELab/ClassEval')
30+
self.assertEqual(task.epochs, 5)
31+
self.assertEqual(task.sandbox.type, "docker")
32+
33+
1634
class TestUtils(unittest.TestCase):
1735

1836
def test_construct_prompt(self):
1937
self.assertEqual(construct_prompt(record), prompt)
20-
21-
22-
# if __name__ == '__main__':
23-
24-
# #Save record to file
25-
# with open('test_data2.py', 'w') as f:
26-
# f.write(f'{record_to_sample(record)}')

src/inspect_evals/class_eval/test_data.py

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -76,4 +76,11 @@ def add(self, x, y):
7676
Test text
7777
"""
7878

79-
sample_code = r"""print("Hello, World!")"""
79+
sample_code = r"""print("Hello, World!")"""
80+
81+
82+
INSTRUCTION = """
83+
84+
You are an expert Python programmer. You will be given a task, and the tests that your code must pass.
85+
86+
"""

0 commit comments

Comments
 (0)