Spaces:
Running
Running
add a reliability guard
Browse files- testing_util.py +85 -0
testing_util.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
import json
|
| 2 |
import sys
|
| 3 |
import faulthandler
|
|
|
|
| 4 |
|
| 5 |
# used for debugging to time steps
|
| 6 |
from datetime import datetime
|
|
@@ -52,6 +53,9 @@ def run_test(sample, test=None, debug=False):
|
|
| 52 |
if test(generated_code) is not None it'll try to run the code.
|
| 53 |
otherwise it'll just return an input and output pair.
|
| 54 |
"""
|
|
|
|
|
|
|
|
|
|
| 55 |
if debug:
|
| 56 |
print(f"start = {datetime.now().time()}")
|
| 57 |
|
|
@@ -436,3 +440,84 @@ def call_method(method, inputs):
|
|
| 436 |
pass
|
| 437 |
return _inner_call_method(method)
|
| 438 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
import json
|
| 2 |
import sys
|
| 3 |
import faulthandler
|
| 4 |
+
import platform
|
| 5 |
|
| 6 |
# used for debugging to time steps
|
| 7 |
from datetime import datetime
|
|
|
|
| 53 |
if test(generated_code) is not None it'll try to run the code.
|
| 54 |
otherwise it'll just return an input and output pair.
|
| 55 |
"""
|
| 56 |
+
# Disable functionalities that can make destructive changes to the test.
|
| 57 |
+
reliability_guard()
|
| 58 |
+
|
| 59 |
if debug:
|
| 60 |
print(f"start = {datetime.now().time()}")
|
| 61 |
|
|
|
|
| 440 |
pass
|
| 441 |
return _inner_call_method(method)
|
| 442 |
|
| 443 |
+
|
| 444 |
+
|
| 445 |
+
|
| 446 |
+
def reliability_guard(maximum_memory_bytes=None):
|
| 447 |
+
"""
|
| 448 |
+
This disables various destructive functions and prevents the generated code
|
| 449 |
+
from interfering with the test (e.g. fork bomb, killing other processes,
|
| 450 |
+
removing filesystem files, etc.)
|
| 451 |
+
WARNING
|
| 452 |
+
This function is NOT a security sandbox. Untrusted code, including, model-
|
| 453 |
+
generated code, should not be blindly executed outside of one. See the
|
| 454 |
+
Codex paper for more information about OpenAI's code sandbox, and proceed
|
| 455 |
+
with caution.
|
| 456 |
+
"""
|
| 457 |
+
|
| 458 |
+
if maximum_memory_bytes is not None:
|
| 459 |
+
import resource
|
| 460 |
+
|
| 461 |
+
resource.setrlimit(resource.RLIMIT_AS, (maximum_memory_bytes, maximum_memory_bytes))
|
| 462 |
+
resource.setrlimit(resource.RLIMIT_DATA, (maximum_memory_bytes, maximum_memory_bytes))
|
| 463 |
+
if not platform.uname().system == "Darwin":
|
| 464 |
+
resource.setrlimit(resource.RLIMIT_STACK, (maximum_memory_bytes, maximum_memory_bytes))
|
| 465 |
+
|
| 466 |
+
faulthandler.disable()
|
| 467 |
+
|
| 468 |
+
import builtins
|
| 469 |
+
|
| 470 |
+
builtins.exit = None
|
| 471 |
+
builtins.quit = None
|
| 472 |
+
|
| 473 |
+
import os
|
| 474 |
+
|
| 475 |
+
os.environ["OMP_NUM_THREADS"] = "1"
|
| 476 |
+
|
| 477 |
+
os.kill = None
|
| 478 |
+
os.system = None
|
| 479 |
+
os.putenv = None
|
| 480 |
+
os.remove = None
|
| 481 |
+
os.removedirs = None
|
| 482 |
+
os.rmdir = None
|
| 483 |
+
os.fchdir = None
|
| 484 |
+
os.setuid = None
|
| 485 |
+
os.fork = None
|
| 486 |
+
os.forkpty = None
|
| 487 |
+
os.killpg = None
|
| 488 |
+
os.rename = None
|
| 489 |
+
os.renames = None
|
| 490 |
+
os.truncate = None
|
| 491 |
+
os.replace = None
|
| 492 |
+
os.unlink = None
|
| 493 |
+
os.fchmod = None
|
| 494 |
+
os.fchown = None
|
| 495 |
+
os.chmod = None
|
| 496 |
+
os.chown = None
|
| 497 |
+
os.chroot = None
|
| 498 |
+
os.fchdir = None
|
| 499 |
+
os.lchflags = None
|
| 500 |
+
os.lchmod = None
|
| 501 |
+
os.lchown = None
|
| 502 |
+
os.getcwd = None
|
| 503 |
+
os.chdir = None
|
| 504 |
+
|
| 505 |
+
import shutil
|
| 506 |
+
|
| 507 |
+
shutil.rmtree = None
|
| 508 |
+
shutil.move = None
|
| 509 |
+
shutil.chown = None
|
| 510 |
+
|
| 511 |
+
import subprocess
|
| 512 |
+
|
| 513 |
+
subprocess.Popen = None # type: ignore
|
| 514 |
+
|
| 515 |
+
__builtins__["help"] = None
|
| 516 |
+
|
| 517 |
+
import sys
|
| 518 |
+
|
| 519 |
+
sys.modules["ipdb"] = None
|
| 520 |
+
sys.modules["joblib"] = None
|
| 521 |
+
sys.modules["resource"] = None
|
| 522 |
+
sys.modules["psutil"] = None
|
| 523 |
+
sys.modules["tkinter"] = None
|