aboutsummaryrefslogtreecommitdiffstats
path: root/backend/routes/forms/unittesting.py
diff options
context:
space:
mode:
Diffstat (limited to 'backend/routes/forms/unittesting.py')
-rw-r--r--backend/routes/forms/unittesting.py94
1 files changed, 59 insertions, 35 deletions
diff --git a/backend/routes/forms/unittesting.py b/backend/routes/forms/unittesting.py
index 2bfeaa9..1b042e4 100644
--- a/backend/routes/forms/unittesting.py
+++ b/backend/routes/forms/unittesting.py
@@ -13,6 +13,10 @@ with open("resources/unittest_template.py") as file:
TEST_TEMPLATE = file.read()
+class BypassDetectedError(Exception):
+ """Detected an attempt at bypassing the unittests."""
+
+
UnittestResult = namedtuple(
"UnittestResult", "question_id question_index return_code passed result"
)
@@ -65,9 +69,12 @@ async def _post_eval(code: str) -> dict[str, str]:
return response.json()
-async def execute_unittest(form_response: FormResponse, form: Form) -> list[UnittestResult]:
+async def execute_unittest(
+ form_response: FormResponse, form: Form
+) -> tuple[list[UnittestResult], list[BypassDetectedError]]:
"""Execute all the unittests in this form and return the results."""
unittest_results = []
+ errors = []
for index, question in enumerate(form.questions):
if question.type == "code":
@@ -101,40 +108,57 @@ async def execute_unittest(form_response: FormResponse, form: Form) -> list[Unit
code = code.replace("### UNIT CODE", unit_code)
try:
- response = await _post_eval(code)
- except HTTPStatusError:
- return_code = 99
- result = "Unable to contact code runner."
- else:
- return_code = int(response["returncode"])
-
- # Parse the stdout if the tests ran successfully
- if return_code == 0:
- stdout = response["stdout"]
- passed = bool(int(stdout[0]))
-
- # If the test failed, we have to populate the result string.
- if not passed:
- failed_tests = stdout[1:].strip().split(";")
-
- # Redact failed hidden tests
- for i, failed_test in enumerate(failed_tests.copy()):
- if failed_test in hidden_tests:
- failed_tests[i] = f"hidden_test_{hidden_tests[failed_test]}"
-
- result = ";".join(failed_tests)
- else:
- result = ""
- elif return_code in (5, 6, 99):
- result = response["stdout"]
- # Killed by NsJail
- elif return_code == 137:
- return_code = 7
- result = "Timed out or ran out of memory."
- # Another code has been returned by CPython because of another failure.
- else:
+ try:
+ response = await _post_eval(code)
+ except HTTPStatusError:
return_code = 99
- result = "Internal error."
+ result = "Unable to contact code runner."
+ else:
+ return_code = int(response["returncode"])
+
+ # Parse the stdout if the tests ran successfully
+ if return_code == 0:
+ stdout = response["stdout"]
+ try:
+ passed = bool(int(stdout[0]))
+ except ValueError:
+ raise BypassDetectedError("Detected a bypass when reading result code.")
+
+ if passed and stdout.strip() != "1":
+ # Most likely a bypass attempt
+ # A 1 was written to stdout to indicate success,
+ # followed by the actual output
+ raise BypassDetectedError(
+ "Detected improper value for stdout in unittest."
+ )
+
+ # If the test failed, we have to populate the result string.
+ elif not passed:
+ failed_tests = stdout[1:].strip().split(";")
+
+ # Redact failed hidden tests
+ for i, failed_test in enumerate(failed_tests.copy()):
+ if failed_test in hidden_tests:
+ failed_tests[i] = f"hidden_test_{hidden_tests[failed_test]}"
+
+ result = ";".join(failed_tests)
+ else:
+ result = ""
+ elif return_code in (5, 6, 99):
+ result = response["stdout"]
+ # Killed by NsJail
+ elif return_code == 137:
+ return_code = 7
+ result = "Timed out or ran out of memory."
+ # Another code has been returned by CPython because of another failure.
+ else:
+ return_code = 99
+ result = "Internal error."
+ except BypassDetectedError as error:
+ return_code = 10
+ result = "Bypass attempt detected, aborting."
+ errors.append(error)
+ passed = False
unittest_results.append(UnittestResult(
question_id=question.id,
@@ -144,4 +168,4 @@ async def execute_unittest(form_response: FormResponse, form: Form) -> list[Unit
result=result
))
- return unittest_results
+ return unittest_results, errors