summaryrefslogtreecommitdiff
path: root/yaksh/evaluator_tests/test_python_evaluation.py
diff options
context:
space:
mode:
Diffstat (limited to 'yaksh/evaluator_tests/test_python_evaluation.py')
-rw-r--r--yaksh/evaluator_tests/test_python_evaluation.py687
1 files changed, 566 insertions, 121 deletions
diff --git a/yaksh/evaluator_tests/test_python_evaluation.py b/yaksh/evaluator_tests/test_python_evaluation.py
index acf5d0a..43cd0ea 100644
--- a/yaksh/evaluator_tests/test_python_evaluation.py
+++ b/yaksh/evaluator_tests/test_python_evaluation.py
@@ -6,25 +6,27 @@ import shutil
from textwrap import dedent
# Local import
+from yaksh.code_evaluator import CodeEvaluator
from yaksh.python_assertion_evaluator import PythonAssertionEvaluator
from yaksh.python_stdio_evaluator import PythonStdioEvaluator
from yaksh.settings import SERVER_TIMEOUT
-
class PythonAssertionEvaluationTestCases(unittest.TestCase):
def setUp(self):
with open('/tmp/test.txt', 'wb') as f:
f.write('2'.encode('ascii'))
tmp_in_dir_path = tempfile.mkdtemp()
self.in_dir = tmp_in_dir_path
- self.test_case_data = [{"test_case": 'assert(add(1,2)==3)', 'weight': 0.0},
- {"test_case": 'assert(add(-1,2)==1)', 'weight': 0.0},
- {"test_case": 'assert(add(-1,-2)==-3)', 'weight': 0.0},
+ self.test_case_data = [{"test_case_type": "standardtestcase", "test_case": 'assert(add(1,2)==3)', 'weight': 0.0},
+ {"test_case_type": "standardtestcase", "test_case": 'assert(add(-1,2)==1)', 'weight': 0.0},
+ {"test_case_type": "standardtestcase", "test_case": 'assert(add(-1,-2)==-3)', 'weight': 0.0},
]
self.timeout_msg = ("Code took more than {0} seconds to run. "
"You probably have an infinite loop in"
" your code.").format(SERVER_TIMEOUT)
self.file_paths = None
+ self.language = 'python'
+ self.test_case_type = 'standardtestcase'
def tearDown(self):
os.remove('/tmp/test.txt')
@@ -33,15 +35,24 @@ class PythonAssertionEvaluationTestCases(unittest.TestCase):
def test_correct_answer(self):
# Given
user_answer = "def add(a,b):\n\treturn a + b"
- kwargs = {'user_answer': user_answer,
- 'test_case_data': self.test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': False
+ # kwargs = {'user_answer': user_answer,
+ # 'test_case_data': self.test_case_data,
+ # 'file_paths': self.file_paths,
+ # 'partial_grading': False,
+ # }
+ kwargs = {
+ 'metadata': {
+ 'user_answer': user_answer,
+ 'file_paths': self.file_paths,
+ 'partial_grading': False,
+ 'language': 'python'
+ },
+ 'test_case_data': self.test_case_data,
}
# When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
+ evaluator = CodeEvaluator(self.in_dir)
+ result = evaluator.evaluate(kwargs)
# Then
self.assertTrue(result.get('success'))
@@ -50,15 +61,20 @@ class PythonAssertionEvaluationTestCases(unittest.TestCase):
def test_incorrect_answer(self):
# Given
user_answer = "def add(a,b):\n\treturn a - b"
- kwargs = {'user_answer': user_answer,
- 'test_case_data': self.test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': False
+ kwargs = {
+ 'metadata': {
+ 'user_answer': user_answer,
+ 'file_paths': self.file_paths,
+ 'partial_grading': False,
+ 'language': 'python'
+ },
+ 'test_case_data': self.test_case_data,
}
# When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
+ # evaluator = PythonAssertionEvaluator()
+ evaluator = CodeEvaluator(self.in_dir)
+ result = evaluator.evaluate(kwargs)
# Then
self.assertFalse(result.get('success'))
@@ -72,111 +88,6 @@ class PythonAssertionEvaluationTestCases(unittest.TestCase):
result.get('error')
)
- def test_partial_incorrect_answer(self):
- # Given
- user_answer = "def add(a,b):\n\treturn abs(a) + abs(b)"
- test_case_data = [{"test_case": 'assert(add(-1,2)==1)', 'weight': 1.0},
- {"test_case": 'assert(add(-1,-2)==-3)', 'weight': 1.0},
- {"test_case": 'assert(add(1,2)==3)', 'weight': 2.0}
- ]
- kwargs = {'user_answer': user_answer,
- 'test_case_data': test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': True
- }
-
- # When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
-
- # Then
- self.assertFalse(result.get('success'))
- self.assertEqual(result.get('weight'), 2.0)
- self.assertIn('AssertionError in: assert(add(-1,2)==1)',
- result.get('error')
- )
- self.assertIn('AssertionError in: assert(add(-1,-2)==-3)',
- result.get('error')
- )
-
- def test_infinite_loop(self):
- # Given
- user_answer = "def add(a, b):\n\twhile True:\n\t\tpass"
- kwargs = {'user_answer': user_answer,
- 'test_case_data': self.test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': False
- }
-
- # When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
-
- # Then
- self.assertFalse(result.get('success'))
- self.assertEqual(result.get('error'), self.timeout_msg)
-
- def test_syntax_error(self):
- # Given
- user_answer = dedent("""
- def add(a, b);
- return a + b
- """)
- syntax_error_msg = ["Traceback",
- "call",
- "File",
- "line",
- "<string>",
- "SyntaxError",
- "invalid syntax"
- ]
- kwargs = {'user_answer': user_answer,
- 'test_case_data': self.test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': False
- }
-
- # When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
- err = result.get("error").splitlines()
-
- # Then
- self.assertFalse(result.get("success"))
- self.assertEqual(5, len(err))
- for msg in syntax_error_msg:
- self.assertIn(msg, result.get("error"))
-
- def test_indent_error(self):
- # Given
- user_answer = dedent("""
- def add(a, b):
- return a + b
- """)
- indent_error_msg = ["Traceback", "call",
- "File",
- "line",
- "<string>",
- "IndentationError",
- "indented block"
- ]
- kwargs = {'user_answer': user_answer,
- 'test_case_data': self.test_case_data,
- 'file_paths': self.file_paths,
- 'partial_grading': False
-
- }
-
- # When
- evaluator = PythonAssertionEvaluator()
- result = evaluator.evaluate(**kwargs)
- err = result.get("error").splitlines()
-
- # Then
- self.assertFalse(result.get("success"))
- self.assertEqual(5, len(err))
- for msg in indent_error_msg:
- self.assertIn(msg, result.get("error"))
def test_name_error(self):
# Given
@@ -542,5 +453,539 @@ class PythonStdIOEvaluationTestCases(unittest.TestCase):
self.assertEqual(result.get('error'), timeout_msg)
self.assertFalse(result.get('success'))
+# class PythonAssertionEvaluationTestCases(unittest.TestCase):
+# def setUp(self):
+# with open('/tmp/test.txt', 'wb') as f:
+# f.write('2'.encode('ascii'))
+# tmp_in_dir_path = tempfile.mkdtemp()
+# self.in_dir = tmp_in_dir_path
+# self.test_case_data = [{"test_case": 'assert(add(1,2)==3)', 'weight': 0.0},
+# {"test_case": 'assert(add(-1,2)==1)', 'weight': 0.0},
+# {"test_case": 'assert(add(-1,-2)==-3)', 'weight': 0.0},
+# ]
+# self.timeout_msg = ("Code took more than {0} seconds to run. "
+# "You probably have an infinite loop in"
+# " your code.").format(SERVER_TIMEOUT)
+# self.file_paths = None
+
+# def tearDown(self):
+# os.remove('/tmp/test.txt')
+# shutil.rmtree(self.in_dir)
+
+# def test_correct_answer(self):
+# # Given
+# user_answer = "def add(a,b):\n\treturn a + b"
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertTrue(result.get('success'))
+# self.assertIn("Correct answer", result.get('error'))
+
+# def test_incorrect_answer(self):
+# # Given
+# user_answer = "def add(a,b):\n\treturn a - b"
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertFalse(result.get('success'))
+# self.assertIn('AssertionError in: assert(add(1,2)==3)',
+# result.get('error')
+# )
+# self.assertIn('AssertionError in: assert(add(-1,2)==1)',
+# result.get('error')
+# )
+# self.assertIn('AssertionError in: assert(add(-1,-2)==-3)',
+# result.get('error')
+# )
+
+# def test_partial_incorrect_answer(self):
+# # Given
+# user_answer = "def add(a,b):\n\treturn abs(a) + abs(b)"
+# test_case_data = [{"test_case": 'assert(add(-1,2)==1)', 'weight': 1.0},
+# {"test_case": 'assert(add(-1,-2)==-3)', 'weight': 1.0},
+# {"test_case": 'assert(add(1,2)==3)', 'weight': 2.0}
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': True
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertFalse(result.get('success'))
+# self.assertEqual(result.get('weight'), 2.0)
+# self.assertIn('AssertionError in: assert(add(-1,2)==1)',
+# result.get('error')
+# )
+# self.assertIn('AssertionError in: assert(add(-1,-2)==-3)',
+# result.get('error')
+# )
+
+# def test_infinite_loop(self):
+# # Given
+# user_answer = "def add(a, b):\n\twhile True:\n\t\tpass"
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertFalse(result.get('success'))
+# self.assertEqual(result.get('error'), self.timeout_msg)
+
+# def test_syntax_error(self):
+# # Given
+# user_answer = dedent("""
+# def add(a, b);
+# return a + b
+# """)
+# syntax_error_msg = ["Traceback",
+# "call",
+# "File",
+# "line",
+# "<string>",
+# "SyntaxError",
+# "invalid syntax"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(5, len(err))
+# for msg in syntax_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_indent_error(self):
+# # Given
+# user_answer = dedent("""
+# def add(a, b):
+# return a + b
+# """)
+# indent_error_msg = ["Traceback", "call",
+# "File",
+# "line",
+# "<string>",
+# "IndentationError",
+# "indented block"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(5, len(err))
+# for msg in indent_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_name_error(self):
+# # Given
+# user_answer = ""
+# name_error_msg = ["Traceback",
+# "call",
+# "NameError",
+# "name",
+# "defined"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(3, len(err))
+# for msg in name_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_recursion_error(self):
+# # Given
+# user_answer = dedent("""
+# def add(a, b):
+# return add(3, 3)
+# """)
+# recursion_error_msg = ["Traceback",
+# "call",
+# "maximum recursion depth exceeded"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# for msg in recursion_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_type_error(self):
+# # Given
+# user_answer = dedent("""
+# def add(a):
+# return a + b
+# """)
+# type_error_msg = ["Traceback",
+# "call",
+# "TypeError",
+# "argument"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(3, len(err))
+# for msg in type_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_value_error(self):
+# # Given
+# user_answer = dedent("""
+# def add(a, b):
+# c = 'a'
+# return int(a) + int(b) + int(c)
+# """)
+# value_error_msg = ["Traceback",
+# "call",
+# "ValueError",
+# "invalid literal",
+# "base"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(4, len(err))
+# for msg in value_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+# def test_file_based_assert(self):
+# # Given
+# self.test_case_data = [{"test_case": "assert(ans()=='2')", "weight": 0.0}]
+# self.file_paths = [('/tmp/test.txt', False)]
+# user_answer = dedent("""
+# def ans():
+# with open("test.txt") as f:
+# return f.read()[0]
+# """)
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertIn("Correct answer", result.get('error'))
+# self.assertTrue(result.get('success'))
+
+# def test_single_testcase_error(self):
+# # Given
+# """ Tests the user answer with just an incorrect test case """
+
+# user_answer = "def palindrome(a):\n\treturn a == a[::-1]"
+# test_case_data = [{"test_case": 's="abbb"\nasert palindrome(s)==False',
+# "weight": 0.0
+# }
+# ]
+# syntax_error_msg = ["Traceback",
+# "call",
+# "File",
+# "line",
+# "<string>",
+# "SyntaxError",
+# "invalid syntax"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(5, len(err))
+# for msg in syntax_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+
+# def test_multiple_testcase_error(self):
+# """ Tests the user answer with an correct test case
+# first and then with an incorrect test case """
+# # Given
+# user_answer = "def palindrome(a):\n\treturn a == a[::-1]"
+# test_case_data = [{"test_case": 'assert(palindrome("abba")==True)',
+# "weight": 0.0
+# },
+# {"test_case": 's="abbb"\nassert palindrome(S)==False',
+# "weight": 0.0
+# }
+# ]
+# name_error_msg = ["Traceback",
+# "call",
+# "File",
+# "line",
+# "<string>",
+# "NameError",
+# "name 'S' is not defined"
+# ]
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonAssertionEvaluator()
+# result = evaluator.evaluate(**kwargs)
+# err = result.get("error").splitlines()
+
+# # Then
+# self.assertFalse(result.get("success"))
+# self.assertEqual(3, len(err))
+# for msg in name_error_msg:
+# self.assertIn(msg, result.get("error"))
+
+
+# class PythonStdIOEvaluationTestCases(unittest.TestCase):
+# def setUp(self):
+# with open('/tmp/test.txt', 'wb') as f:
+# f.write('2'.encode('ascii'))
+# self.file_paths = None
+
+# def test_correct_answer_integer(self):
+# # Given
+# self.test_case_data = [{"expected_input": "1\n2",
+# "expected_output": "3",
+# "weight": 0.0
+# }]
+# user_answer = dedent("""
+# a = int(input())
+# b = int(input())
+# print(a+b)
+# """
+# )
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertTrue(result.get('success'))
+# self.assertIn("Correct answer", result.get('error'))
+
+# def test_correct_answer_list(self):
+# # Given
+# self.test_case_data = [{"expected_input": "1,2,3\n5,6,7",
+# "expected_output": "[1, 2, 3, 5, 6, 7]",
+# "weight": 0.0
+# }]
+# user_answer = dedent("""
+# from six.moves import input
+# input_a = input()
+# input_b = input()
+# a = [int(i) for i in input_a.split(',')]
+# b = [int(i) for i in input_b.split(',')]
+# print(a+b)
+# """
+# )
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertTrue(result.get('success'))
+# self.assertIn("Correct answer", result.get('error'))
+
+# def test_correct_answer_string(self):
+# # Given
+# self.test_case_data = [{"expected_input": ("the quick brown fox jumps over the lazy dog\nthe"),
+# "expected_output": "2",
+# "weight": 0.0
+# }]
+# user_answer = dedent("""
+# from six.moves import input
+# a = str(input())
+# b = str(input())
+# print(a.count(b))
+# """
+# )
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertTrue(result.get('success'))
+# self.assertIn("Correct answer", result.get('error'))
+
+# def test_incorrect_answer_integer(self):
+# # Given
+# self.test_case_data = [{"expected_input": "1\n2",
+# "expected_output": "3",
+# "weight": 0.0
+# }]
+# user_answer = dedent("""
+# a = int(input())
+# b = int(input())
+# print(a-b)
+# """
+# )
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertFalse(result.get('success'))
+# self.assertIn("Incorrect answer", result.get('error'))
+
+# def test_file_based_answer(self):
+# # Given
+# self.test_case_data = [{"expected_input": "",
+# "expected_output": "2",
+# "weight": 0.0
+# }]
+# self.file_paths = [('/tmp/test.txt', False)]
+
+# user_answer = dedent("""
+# with open("test.txt") as f:
+# a = f.read()
+# print(a[0])
+# """
+# )
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': self.test_case_data,
+# 'file_paths': self.file_paths,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertEqual(result.get('error'), "Correct answer\n")
+# self.assertTrue(result.get('success'))
+
+# def test_infinite_loop(self):
+# # Given
+# test_case_data = [{"expected_input": "1\n2",
+# "expected_output": "3",
+# "weight": 0.0
+# }]
+# timeout_msg = ("Code took more than {0} seconds to run. "
+# "You probably have an infinite loop in"
+# " your code.").format(SERVER_TIMEOUT)
+# user_answer = "while True:\n\tpass"
+# kwargs = {'user_answer': user_answer,
+# 'test_case_data': test_case_data,
+# 'partial_grading': False
+# }
+
+# # When
+# evaluator = PythonStdioEvaluator()
+# result = evaluator.evaluate(**kwargs)
+
+# # Then
+# self.assertEqual(result.get('error'), timeout_msg)
+# self.assertFalse(result.get('success'))
+
if __name__ == '__main__':
unittest.main()