1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
from evaluator import *

DESCRIPTION = "Test if the model can generate a python program that defines dataflow DSL."

TAGS = ['code', 'python']

question = """
Write a python class Const, Square, Print so that I can write, for example,

Cost(5) >> Square() >> Inc() >> Print()

and the resulting python program will print 26 to the screen.
"""

test_case, answer = make_python_test([("Const(2) >> Square() >> Inc() >> Square()", "25")])

TestMakeShiftOp = question >> LLMRun() >> ExtractCode() >> PythonRun() >> SubstringEvaluator(answer)


if __name__ == "__main__":
    print(run_test(TestMakeShiftOp))